PyPI - vellum-ai - Versions diffs - 0.3.14__py3-none-any.whl → 0.3.15__py3-none-any.whl - Mend

vellum-ai 0.3.14py3-none-any.whl → 0.3.15py3-none-any.whl

Files changed (318) hide show

vellum/__init__.py +22 -0
vellum/client.py +846 -100
vellum/core/__init__.py +8 -0
vellum/core/client_wrapper.py +27 -8
vellum/core/file.py +38 -0
vellum/core/http_client.py +130 -0
vellum/core/jsonable_encoder.py +2 -2
vellum/core/request_options.py +32 -0
vellum/resources/deployments/client.py +161 -24
vellum/resources/document_indexes/client.py +337 -80
vellum/resources/documents/client.py +278 -58
vellum/resources/folder_entities/client.py +60 -10
vellum/resources/model_versions/client.py +48 -8
vellum/resources/registered_prompts/client.py +52 -6
vellum/resources/sandboxes/client.py +108 -26
vellum/resources/test_suite_runs/client.py +221 -38
vellum/resources/test_suites/client.py +110 -24
vellum/resources/workflow_deployments/client.py +110 -14
vellum/types/__init__.py +20 -0
vellum/types/api_node_result.py +1 -0
vellum/types/api_node_result_data.py +4 -2
vellum/types/array_chat_message_content.py +1 -0
vellum/types/array_chat_message_content_item.py +6 -5
vellum/types/array_chat_message_content_item_request.py +6 -5
vellum/types/array_chat_message_content_request.py +1 -0
vellum/types/array_enum.py +2 -2
vellum/types/array_variable_value_item.py +16 -10
vellum/types/chat_history_enum.py +2 -2
vellum/types/chat_history_input_request.py +6 -1
vellum/types/chat_history_variable_value.py +2 -1
vellum/types/chat_message.py +7 -5
vellum/types/chat_message_content.py +8 -6
vellum/types/chat_message_content_request.py +8 -6
vellum/types/chat_message_request.py +7 -5
vellum/types/code_execution_node_array_result.py +31 -0
vellum/types/code_execution_node_chat_history_result.py +2 -1
vellum/types/code_execution_node_error_result.py +2 -1
vellum/types/code_execution_node_function_call_result.py +31 -0
vellum/types/code_execution_node_json_result.py +2 -1
vellum/types/code_execution_node_number_result.py +2 -1
vellum/types/code_execution_node_result.py +1 -0
vellum/types/code_execution_node_result_data.py +2 -1
vellum/types/code_execution_node_result_output.py +36 -8
vellum/types/code_execution_node_search_results_result.py +2 -1
vellum/types/code_execution_node_string_result.py +2 -1
vellum/types/conditional_node_result.py +1 -0
vellum/types/conditional_node_result_data.py +2 -1
vellum/types/deployment_provider_payload_response.py +1 -0
vellum/types/deployment_read.py +32 -17
vellum/types/document_document_to_document_index.py +21 -15
vellum/types/document_index_read.py +32 -19
vellum/types/document_read.py +34 -24
vellum/types/document_status.py +2 -2
vellum/types/enriched_normalized_completion.py +36 -19
vellum/types/error_enum.py +2 -2
vellum/types/error_variable_value.py +2 -1
vellum/types/execute_prompt_api_error_response.py +5 -1
vellum/types/execute_prompt_event.py +8 -6
vellum/types/execute_prompt_response.py +4 -4
vellum/types/execute_workflow_error_response.py +5 -1
vellum/types/execute_workflow_response.py +3 -2
vellum/types/execute_workflow_stream_error_response.py +5 -1
vellum/types/execute_workflow_workflow_result_event.py +4 -4
vellum/types/execution_array_vellum_value.py +7 -2
vellum/types/execution_chat_history_vellum_value.py +7 -2
vellum/types/execution_error_vellum_value.py +7 -2
vellum/types/execution_function_call_vellum_value.py +7 -2
vellum/types/execution_json_vellum_value.py +7 -2
vellum/types/execution_number_vellum_value.py +7 -2
vellum/types/execution_search_results_vellum_value.py +7 -2
vellum/types/execution_string_vellum_value.py +7 -2
vellum/types/execution_vellum_value.py +16 -10
vellum/types/fulfilled_enum.py +2 -2
vellum/types/fulfilled_execute_prompt_event.py +2 -1
vellum/types/fulfilled_execute_prompt_response.py +12 -5
vellum/types/fulfilled_execute_workflow_workflow_result_event.py +1 -0
vellum/types/fulfilled_function_call.py +2 -1
vellum/types/fulfilled_prompt_execution_meta.py +3 -2
vellum/types/fulfilled_workflow_node_result_event.py +6 -5
vellum/types/function_call.py +4 -4
vellum/types/function_call_chat_message_content.py +1 -0
vellum/types/function_call_chat_message_content_request.py +1 -0
vellum/types/function_call_chat_message_content_value.py +2 -1
vellum/types/function_call_chat_message_content_value_request.py +2 -1
vellum/types/function_call_enum.py +2 -2
vellum/types/function_call_variable_value.py +1 -0
vellum/types/generate_error_response.py +5 -1
vellum/types/generate_options_request.py +8 -5
vellum/types/generate_request.py +15 -9
vellum/types/generate_result.py +10 -6
vellum/types/generate_result_data.py +5 -3
vellum/types/generate_result_error.py +5 -1
vellum/types/generate_stream_response.py +1 -0
vellum/types/generate_stream_result.py +3 -2
vellum/types/generate_stream_result_data.py +1 -0
vellum/types/image_chat_message_content.py +1 -0
vellum/types/image_chat_message_content_request.py +1 -0
vellum/types/image_enum.py +2 -2
vellum/types/image_variable_value.py +2 -1
vellum/types/initiated_enum.py +2 -2
vellum/types/initiated_execute_prompt_event.py +2 -1
vellum/types/initiated_prompt_execution_meta.py +5 -4
vellum/types/initiated_workflow_node_result_event.py +5 -4
vellum/types/json_enum.py +2 -2
vellum/types/json_input_request.py +6 -1
vellum/types/json_variable_value.py +2 -1
vellum/types/logprobs_enum.py +2 -2
vellum/types/metadata_filter_config_request.py +7 -6
vellum/types/metadata_filter_rule_request.py +7 -6
vellum/types/model_version_build_config.py +12 -7
vellum/types/model_version_exec_config.py +18 -11
vellum/types/model_version_exec_config_parameters.py +7 -6
vellum/types/model_version_read.py +51 -32
vellum/types/model_version_sandbox_snapshot.py +17 -4
vellum/types/named_test_case_chat_history_variable_value_request.py +2 -1
vellum/types/named_test_case_error_variable_value_request.py +2 -1
vellum/types/named_test_case_json_variable_value_request.py +2 -1
vellum/types/named_test_case_number_variable_value_request.py +2 -1
vellum/types/named_test_case_search_results_variable_value_request.py +2 -1
vellum/types/named_test_case_string_variable_value_request.py +2 -1
vellum/types/named_test_case_variable_value_request.py +12 -8
vellum/types/node_input_compiled_array_value.py +2 -1
vellum/types/node_input_compiled_chat_history_value.py +2 -1
vellum/types/node_input_compiled_error_value.py +2 -1
vellum/types/node_input_compiled_function_call.py +32 -0
vellum/types/node_input_compiled_json_value.py +2 -1
vellum/types/node_input_compiled_number_value.py +2 -1
vellum/types/node_input_compiled_search_results_value.py +2 -1
vellum/types/node_input_compiled_string_value.py +2 -1
vellum/types/node_input_variable_compiled_value.py +26 -9
vellum/types/node_output_compiled_array_value.py +2 -1
vellum/types/node_output_compiled_chat_history_value.py +2 -1
vellum/types/node_output_compiled_error_value.py +2 -1
vellum/types/node_output_compiled_function_value.py +2 -1
vellum/types/node_output_compiled_json_value.py +2 -1
vellum/types/node_output_compiled_number_value.py +2 -1
vellum/types/node_output_compiled_search_results_value.py +2 -1
vellum/types/node_output_compiled_string_value.py +2 -1
vellum/types/node_output_compiled_value.py +16 -10
vellum/types/normalized_log_probs.py +2 -1
vellum/types/normalized_token_log_probs.py +3 -2
vellum/types/number_enum.py +2 -2
vellum/types/number_variable_value.py +2 -1
vellum/types/paginated_document_index_read_list.py +5 -4
vellum/types/paginated_slim_deployment_read_list.py +5 -4
vellum/types/paginated_slim_document_list.py +5 -4
vellum/types/paginated_slim_workflow_deployment_list.py +5 -4
vellum/types/paginated_test_suite_run_execution_list.py +5 -4
vellum/types/prompt_deployment_expand_meta_request_request.py +25 -15
vellum/types/prompt_deployment_input_request.py +6 -5
vellum/types/prompt_execution_meta.py +6 -5
vellum/types/prompt_node_result.py +1 -0
vellum/types/prompt_node_result_data.py +4 -3
vellum/types/prompt_output.py +8 -6
vellum/types/prompt_template_block.py +1 -0
vellum/types/prompt_template_block_data.py +1 -0
vellum/types/prompt_template_block_data_request.py +1 -0
vellum/types/prompt_template_block_properties.py +11 -10
vellum/types/prompt_template_block_properties_request.py +11 -10
vellum/types/prompt_template_block_request.py +1 -0
vellum/types/raw_prompt_execution_overrides_request.py +11 -5
vellum/types/register_prompt_error_response.py +5 -1
vellum/types/register_prompt_model_parameters_request.py +5 -4
vellum/types/register_prompt_prompt.py +10 -2
vellum/types/register_prompt_prompt_info_request.py +5 -3
vellum/types/register_prompt_response.py +30 -10
vellum/types/registered_prompt_deployment.py +15 -3
vellum/types/registered_prompt_input_variable_request.py +3 -2
vellum/types/registered_prompt_model_version.py +10 -2
vellum/types/registered_prompt_sandbox.py +10 -2
vellum/types/registered_prompt_sandbox_snapshot.py +5 -1
vellum/types/rejected_enum.py +2 -2
vellum/types/rejected_execute_prompt_event.py +2 -1
vellum/types/rejected_execute_prompt_response.py +12 -5
vellum/types/rejected_execute_workflow_workflow_result_event.py +1 -0
vellum/types/rejected_function_call.py +2 -1
vellum/types/rejected_prompt_execution_meta.py +3 -2
vellum/types/rejected_workflow_node_result_event.py +4 -3
vellum/types/sandbox_scenario.py +11 -3
vellum/types/scenario_input.py +4 -3
vellum/types/scenario_input_request.py +4 -3
vellum/types/search_error_response.py +5 -1
vellum/types/search_filters_request.py +10 -6
vellum/types/search_node_result.py +1 -0
vellum/types/search_node_result_data.py +7 -4
vellum/types/search_request_options_request.py +20 -8
vellum/types/search_response.py +5 -3
vellum/types/search_result.py +15 -5
vellum/types/search_result_document.py +20 -8
vellum/types/search_result_document_request.py +15 -7
vellum/types/search_result_merging_request.py +5 -1
vellum/types/search_result_request.py +15 -5
vellum/types/search_results_enum.py +2 -2
vellum/types/search_results_variable_value.py +2 -1
vellum/types/search_weights_request.py +10 -4
vellum/types/slim_deployment_read.py +28 -14
vellum/types/slim_document.py +56 -35
vellum/types/slim_workflow_deployment.py +37 -24
vellum/types/streaming_enum.py +2 -2
vellum/types/streaming_execute_prompt_event.py +6 -4
vellum/types/streaming_prompt_execution_meta.py +2 -1
vellum/types/streaming_workflow_node_result_event.py +6 -5
vellum/types/string_chat_message_content.py +1 -0
vellum/types/string_chat_message_content_request.py +1 -0
vellum/types/string_enum.py +2 -2
vellum/types/string_input_request.py +6 -1
vellum/types/string_variable_value.py +2 -1
vellum/types/submit_completion_actual_request.py +25 -13
vellum/types/submit_completion_actuals_error_response.py +1 -0
vellum/types/submit_workflow_execution_actual_request.py +6 -5
vellum/types/subworkflow_enum.py +2 -2
vellum/types/subworkflow_node_result.py +1 -0
vellum/types/templating_node_array_result.py +31 -0
vellum/types/templating_node_chat_history_result.py +2 -1
vellum/types/templating_node_error_result.py +2 -1
vellum/types/templating_node_function_call_result.py +31 -0
vellum/types/templating_node_json_result.py +2 -1
vellum/types/templating_node_number_result.py +2 -1
vellum/types/templating_node_result.py +1 -0
vellum/types/templating_node_result_data.py +1 -0
vellum/types/templating_node_result_output.py +36 -8
vellum/types/templating_node_search_results_result.py +2 -1
vellum/types/templating_node_string_result.py +2 -1
vellum/types/terminal_node_array_result.py +8 -3
vellum/types/terminal_node_chat_history_result.py +8 -3
vellum/types/terminal_node_error_result.py +8 -3
vellum/types/terminal_node_function_call_result.py +8 -3
vellum/types/terminal_node_json_result.py +8 -3
vellum/types/terminal_node_number_result.py +8 -3
vellum/types/terminal_node_result.py +1 -0
vellum/types/terminal_node_result_data.py +1 -0
vellum/types/terminal_node_result_output.py +16 -10
vellum/types/terminal_node_search_results_result.py +8 -3
vellum/types/terminal_node_string_result.py +8 -3
vellum/types/test_case_chat_history_variable_value.py +2 -1
vellum/types/test_case_error_variable_value.py +2 -1
vellum/types/test_case_json_variable_value.py +2 -1
vellum/types/test_case_number_variable_value.py +2 -1
vellum/types/test_case_search_results_variable_value.py +2 -1
vellum/types/test_case_string_variable_value.py +2 -1
vellum/types/test_case_variable_value.py +12 -8
vellum/types/test_suite_run_deployment_release_tag_exec_config.py +5 -3
vellum/types/test_suite_run_deployment_release_tag_exec_config_data.py +10 -4
vellum/types/test_suite_run_deployment_release_tag_exec_config_data_request.py +10 -4
vellum/types/test_suite_run_deployment_release_tag_exec_config_request.py +5 -3
vellum/types/test_suite_run_deployment_release_tag_exec_config_type_enum.py +2 -2
vellum/types/test_suite_run_exec_config.py +4 -4
vellum/types/test_suite_run_exec_config_request.py +4 -4
vellum/types/test_suite_run_execution.py +1 -0
vellum/types/test_suite_run_execution_chat_history_output.py +2 -1
vellum/types/test_suite_run_execution_error_output.py +2 -1
vellum/types/test_suite_run_execution_json_output.py +2 -1
vellum/types/test_suite_run_execution_metric_result.py +1 -0
vellum/types/test_suite_run_execution_number_output.py +2 -1
vellum/types/test_suite_run_execution_output.py +12 -8
vellum/types/test_suite_run_execution_search_results_output.py +2 -1
vellum/types/test_suite_run_execution_string_output.py +2 -1
vellum/types/test_suite_run_metric_error_output.py +1 -0
vellum/types/test_suite_run_metric_error_output_type_enum.py +2 -2
vellum/types/test_suite_run_metric_number_output.py +1 -0
vellum/types/test_suite_run_metric_number_output_type_enum.py +2 -2
vellum/types/test_suite_run_metric_output.py +4 -4
vellum/types/test_suite_run_read.py +16 -14
vellum/types/test_suite_run_test_suite.py +1 -0
vellum/types/test_suite_run_workflow_release_tag_exec_config.py +5 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config_data.py +10 -6
vellum/types/test_suite_run_workflow_release_tag_exec_config_data_request.py +10 -6
vellum/types/test_suite_run_workflow_release_tag_exec_config_request.py +5 -3
vellum/types/test_suite_run_workflow_release_tag_exec_config_type_enum.py +2 -2
vellum/types/test_suite_test_case.py +3 -2
vellum/types/upload_document_error_response.py +1 -0
vellum/types/upload_document_response.py +5 -1
vellum/types/vellum_error.py +1 -0
vellum/types/vellum_error_request.py +1 -0
vellum/types/vellum_image.py +2 -1
vellum/types/vellum_image_request.py +2 -1
vellum/types/vellum_variable.py +1 -0
vellum/types/workflow_deployment_read.py +37 -24
vellum/types/workflow_event_error.py +1 -0
vellum/types/workflow_execution_actual_chat_history_request.py +25 -15
vellum/types/workflow_execution_actual_json_request.py +25 -15
vellum/types/workflow_execution_actual_string_request.py +25 -15
vellum/types/workflow_execution_node_result_event.py +3 -2
vellum/types/workflow_execution_workflow_result_event.py +3 -2
vellum/types/workflow_node_result_data.py +16 -10
vellum/types/workflow_node_result_event.py +8 -6
vellum/types/workflow_output.py +18 -11
vellum/types/workflow_output_array.py +7 -2
vellum/types/workflow_output_chat_history.py +7 -2
vellum/types/workflow_output_error.py +7 -2
vellum/types/workflow_output_function_call.py +7 -2
vellum/types/workflow_output_image.py +7 -2
vellum/types/workflow_output_json.py +7 -2
vellum/types/workflow_output_number.py +7 -2
vellum/types/workflow_output_search_results.py +7 -2
vellum/types/workflow_output_string.py +7 -2
vellum/types/workflow_request_chat_history_input_request.py +6 -1
vellum/types/workflow_request_input_request.py +8 -6
vellum/types/workflow_request_json_input_request.py +6 -1
vellum/types/workflow_request_number_input_request.py +6 -1
vellum/types/workflow_request_string_input_request.py +6 -1
vellum/types/workflow_result_event.py +5 -4
vellum/types/workflow_result_event_output_data.py +16 -10
vellum/types/workflow_result_event_output_data_array.py +8 -5
vellum/types/workflow_result_event_output_data_chat_history.py +8 -5
vellum/types/workflow_result_event_output_data_error.py +8 -5
vellum/types/workflow_result_event_output_data_function_call.py +8 -5
vellum/types/workflow_result_event_output_data_json.py +8 -5
vellum/types/workflow_result_event_output_data_number.py +8 -5
vellum/types/workflow_result_event_output_data_search_results.py +8 -5
vellum/types/workflow_result_event_output_data_string.py +11 -7
vellum/types/workflow_stream_event.py +4 -4
vellum/version.py +4 -0
{vellum_ai-0.3.14.dist-info → vellum_ai-0.3.15.dist-info}/METADATA +4 -4
vellum_ai-0.3.15.dist-info/RECORD +365 -0
vellum_ai-0.3.14.dist-info/RECORD +0 -356
{vellum_ai-0.3.14.dist-info → vellum_ai-0.3.15.dist-info}/LICENSE +0 -0
{vellum_ai-0.3.14.dist-info → vellum_ai-0.3.15.dist-info}/WHEEL +0 -0

vellum/core/__init__.py CHANGED Viewed

@@ -3,14 +3,22 @@
 from .api_error import ApiError
 from .client_wrapper import AsyncClientWrapper, BaseClientWrapper, SyncClientWrapper
 from .datetime_utils import serialize_datetime
+from .file import File, convert_file_dict_to_httpx_tuples
+from .http_client import AsyncHttpClient, HttpClient
 from .jsonable_encoder import jsonable_encoder
 from .remove_none_from_dict import remove_none_from_dict
+from .request_options import RequestOptions
 __all__ = [
     "ApiError",
     "AsyncClientWrapper",
+    "AsyncHttpClient",
     "BaseClientWrapper",
+    "File",
+    "HttpClient",
+    "RequestOptions",
     "SyncClientWrapper",
+    "convert_file_dict_to_httpx_tuples",
     "jsonable_encoder",
     "remove_none_from_dict",
     "serialize_datetime",

vellum/core/client_wrapper.py CHANGED Viewed

@@ -5,18 +5,20 @@ import typing
 import httpx
 from ..environment import VellumEnvironment
+from .http_client import AsyncHttpClient, HttpClient
 class BaseClientWrapper:
-    def __init__(self, *, api_key: str, environment: VellumEnvironment):
+    def __init__(self, *, api_key: str, environment: VellumEnvironment, timeout: typing.Optional[float] = None):
         self.api_key = api_key
         self._environment = environment
+        self._timeout = timeout
     def get_headers(self) -> typing.Dict[str, str]:
         headers: typing.Dict[str, str] = {
             "X-Fern-Language": "Python",
             "X-Fern-SDK-Name": "vellum-ai",
-            "X-Fern-SDK-Version": "0.3.14",
+            "X-Fern-SDK-Version": "0.3.15",
         }
         headers["X_API_KEY"] = self.api_key
         return headers
@@ -24,14 +26,31 @@ class BaseClientWrapper:
     def get_environment(self) -> VellumEnvironment:
         return self._environment
+    def get_timeout(self) -> typing.Optional[float]:
+        return self._timeout
 class SyncClientWrapper(BaseClientWrapper):
-    def __init__(self, *, api_key: str, environment: VellumEnvironment, httpx_client: httpx.Client):
-        super().__init__(api_key=api_key, environment=environment)
-        self.httpx_client = httpx_client
+    def __init__(
+        self,
+        *,
+        api_key: str,
+        environment: VellumEnvironment,
+        timeout: typing.Optional[float] = None,
+        httpx_client: httpx.Client
+    ):
+        super().__init__(api_key=api_key, environment=environment, timeout=timeout)
+        self.httpx_client = HttpClient(httpx_client=httpx_client)
 class AsyncClientWrapper(BaseClientWrapper):
-    def __init__(self, *, api_key: str, environment: VellumEnvironment, httpx_client: httpx.AsyncClient):
-        super().__init__(api_key=api_key, environment=environment)
-        self.httpx_client = httpx_client
+    def __init__(
+        self,
+        *,
+        api_key: str,
+        environment: VellumEnvironment,
+        timeout: typing.Optional[float] = None,
+        httpx_client: httpx.AsyncClient
+    ):
+        super().__init__(api_key=api_key, environment=environment, timeout=timeout)
+        self.httpx_client = AsyncHttpClient(httpx_client=httpx_client)

vellum/core/file.py ADDED Viewed

@@ -0,0 +1,38 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+# File typing inspired by the flexibility of types within the httpx library
+# https://github.com/encode/httpx/blob/master/httpx/_types.py
+# Raw content of a single file: an open binary stream, a bytes object, or a str.
+FileContent = typing.Union[typing.IO[bytes], bytes, str]
+# A single file to upload: either the bare content, or a tuple that additionally carries an
+# optional filename, an optional content type and a mapping of extra headers.
+File = typing.Union[
+    # file (or bytes)
+    FileContent,
+    # (filename, file (or bytes))
+    typing.Tuple[typing.Optional[str], FileContent],
+    # (filename, file (or bytes), content_type)
+    typing.Tuple[typing.Optional[str], FileContent, typing.Optional[str]],
+    # (filename, file (or bytes), content_type, headers)
+    typing.Tuple[typing.Optional[str], FileContent, typing.Optional[str], typing.Mapping[str, str]],
+]
+def convert_file_dict_to_httpx_tuples(
+    d: typing.Dict[str, typing.Union[File, typing.List[File]]]
+) -> typing.List[typing.Tuple[str, File]]:
+    """
+    Flatten a mapping of field name -> file (or list of files) into a list of
+    (field name, file) tuples, preserving the mapping's iteration order.
+    HTTPX usually takes a dict of files, but sending several files under the
+    same field name requires the list-of-tuples form, which works equally well
+    for single files.
+    https://github.com/encode/httpx/pull/1032
+    """
+    pairs = []
+    for field_name, value in d.items():
+        # Normalise a single file to a one-element list so both shapes share one code path.
+        entries = value if isinstance(value, list) else [value]
+        pairs.extend((field_name, entry) for entry in entries)
+    return pairs

vellum/core/http_client.py ADDED Viewed

@@ -0,0 +1,130 @@
+# This file was auto-generated by Fern from our API Definition.
+import asyncio
+import email.utils
+import re
+import time
+import typing
+from contextlib import asynccontextmanager, contextmanager
+from functools import wraps
+from random import random
+import httpx
+# Base delay of the exponential backoff; _retry_timeout multiplies it by 2 ** retries.
+INITIAL_RETRY_DELAY_SECONDS = 0.5
+# Upper bound applied to the computed backoff delay before jitter is applied.
+MAX_RETRY_DELAY_SECONDS = 10
+# Largest delay requested through a response header that _retry_timeout honours as-is;
+# longer requests fall back to the computed backoff.
+MAX_RETRY_DELAY_SECONDS_FROM_HEADER = 30
+def _parse_retry_after(response_headers: httpx.Headers) -> typing.Optional[float]:
+    """
+    Parse the retry delay requested by the server and return it as a number of seconds.
+    The `retry-after-ms` header (integer milliseconds) takes precedence. Otherwise the
+    `Retry-After` header is read, either as a whole number of seconds or as an HTTP date.
+    Inspired by the urllib3 retry implementation.
+    Parameters:
+        - response_headers: httpx.Headers. Headers of the response that triggered the retry.
+    Returns:
+        The non-negative number of seconds to wait, or None when no usable header is present.
+    """
+    retry_after_ms = response_headers.get("retry-after-ms")
+    if retry_after_ms is not None:
+        try:
+            # Header values are strings, so convert before comparing. Comparing the raw string
+            # with 0 raises TypeError, which used to be swallowed and made this header a no-op.
+            return max(int(retry_after_ms), 0) / 1000
+        except (TypeError, ValueError):
+            # Malformed value: fall through to the standard Retry-After header.
+            pass
+    retry_after = response_headers.get("retry-after")
+    if retry_after is None:
+        return None
+    # Attempt to parse the header as an int.
+    if re.match(r"^\s*[0-9]+\s*$", retry_after):
+        seconds = float(retry_after)
+    # Fallback to parsing it as a date.
+    else:
+        retry_date_tuple = email.utils.parsedate_tz(retry_after)
+        if retry_date_tuple is None:
+            return None
+        if retry_date_tuple[9] is None:  # Python 2
+            # Assume UTC if no timezone was specified
+            # On Python2.7, parsedate_tz returns None for a timezone offset
+            # instead of 0 if no timezone is given, where mktime_tz treats
+            # a None timezone offset as local time.
+            retry_date_tuple = retry_date_tuple[:9] + (0,) + retry_date_tuple[10:]
+        retry_date = email.utils.mktime_tz(retry_date_tuple)
+        seconds = retry_date - time.time()
+    # A date in the past (or a clock skew) must not produce a negative wait.
+    if seconds < 0:
+        seconds = 0
+    return seconds
+def _retry_timeout(response: httpx.Response, retries: int) -> float:
+    """
+    Compute how many seconds to wait before the next retry of a request.
+    A delay requested by the server through the response headers wins as long as it does not
+    exceed MAX_RETRY_DELAY_SECONDS_FROM_HEADER. Otherwise the delay is an exponential backoff
+    based on the number of retries already made, capped and then reduced by a random jitter.
+    """
+    # Honour the server's own request when it is present and reasonable.
+    server_delay = _parse_retry_after(response.headers)
+    if server_delay is not None and server_delay <= MAX_RETRY_DELAY_SECONDS_FROM_HEADER:
+        return server_delay
+    # Exponential backoff, never longer than MAX_RETRY_DELAY_SECONDS.
+    uncapped_delay = INITIAL_RETRY_DELAY_SECONDS * pow(2.0, retries)
+    backoff = min(uncapped_delay, MAX_RETRY_DELAY_SECONDS)
+    # Shorten the delay by up to 25% so that concurrent clients do not retry in lockstep.
+    jittered = backoff * (1 - 0.25 * random())
+    if jittered >= 0:
+        return jittered
+    return 0
+def _should_retry(response: httpx.Response) -> bool:
+    """Return True for any status code of 500 or above, and for 408, 409 and 429."""
+    status = response.status_code
+    if status >= 500:
+        return True
+    return status in (429, 408, 409)
+class HttpClient:
+    """
+    Wrapper around a synchronous `httpx.Client` that re-sends a request when the response
+    status is retriable (see `_should_retry`), sleeping between attempts.
+    """
+    def __init__(self, *, httpx_client: httpx.Client):
+        self.httpx_client = httpx_client
+    # Ensure that the signature of the `request` method is the same as the `httpx.Client.request` method
+    @wraps(httpx.Client.request)
+    def request(
+        self, *args: typing.Any, max_retries: typing.Optional[int] = 0, retries: int = 0, **kwargs: typing.Any
+    ) -> httpx.Response:
+        """
+        Send a request through the wrapped client, retrying retriable responses.
+        Parameters:
+            - max_retries: typing.Optional[int]. Maximum number of retries; None means no retries.
+            - retries: int. Number of retries already made; used as the starting backoff exponent.
+        All other arguments are forwarded unchanged to `httpx.Client.request`.
+        Returns the last response received, whether or not its status is retriable.
+        """
+        # Callers forward `request_options.get("max_retries")`, which is None when the key is
+        # absent. Treat that as "no retries" instead of failing on `None > retries`.
+        retry_budget = 0 if max_retries is None else max_retries
+        attempt = retries
+        response = self.httpx_client.request(*args, **kwargs)
+        while attempt < retry_budget and _should_retry(response=response):
+            time.sleep(_retry_timeout(response=response, retries=attempt))
+            attempt += 1
+            response = self.httpx_client.request(*args, **kwargs)
+        return response
+    @wraps(httpx.Client.stream)
+    @contextmanager
+    def stream(self, *args: typing.Any, max_retries: int = 0, retries: int = 0, **kwargs: typing.Any) -> typing.Any:
+        """
+        Open a streaming response through the wrapped client.
+        `max_retries` and `retries` are accepted so they are not forwarded to httpx, but they
+        are not used: streamed requests are never retried here.
+        """
+        with self.httpx_client.stream(*args, **kwargs) as stream:
+            yield stream
+class AsyncHttpClient:
+    """
+    Wrapper around an `httpx.AsyncClient` that re-sends a request when the response status is
+    retriable (see `_should_retry`), awaiting a delay between attempts.
+    """
+    def __init__(self, *, httpx_client: httpx.AsyncClient):
+        self.httpx_client = httpx_client
+    # Ensure that the signature of the `request` method is the same as the `httpx.Client.request` method
+    @wraps(httpx.AsyncClient.request)
+    async def request(
+        self, *args: typing.Any, max_retries: typing.Optional[int] = 0, retries: int = 0, **kwargs: typing.Any
+    ) -> httpx.Response:
+        """
+        Send a request through the wrapped client, retrying retriable responses.
+        Parameters:
+            - max_retries: typing.Optional[int]. Maximum number of retries; None means no retries.
+            - retries: int. Number of retries already made; used as the starting backoff exponent.
+        All other arguments are forwarded unchanged to `httpx.AsyncClient.request`.
+        Returns the last response received, whether or not its status is retriable.
+        """
+        # Callers forward `request_options.get("max_retries")`, which is None when the key is
+        # absent. Treat that as "no retries" instead of failing on `None > retries`.
+        retry_budget = 0 if max_retries is None else max_retries
+        attempt = retries
+        response = await self.httpx_client.request(*args, **kwargs)
+        while attempt < retry_budget and _should_retry(response=response):
+            await asyncio.sleep(_retry_timeout(response=response, retries=attempt))
+            attempt += 1
+            response = await self.httpx_client.request(*args, **kwargs)
+        return response
+    @wraps(httpx.AsyncClient.stream)
+    @asynccontextmanager
+    async def stream(
+        self, *args: typing.Any, max_retries: int = 0, retries: int = 0, **kwargs: typing.Any
+    ) -> typing.Any:
+        """
+        Open a streaming response through the wrapped client.
+        `max_retries` and `retries` are accepted so they are not forwarded to httpx, but they
+        are not used: streamed requests are never retried here.
+        """
+        async with self.httpx_client.stream(*args, **kwargs) as stream:
+            yield stream

vellum/core/jsonable_encoder.py CHANGED Viewed

@@ -65,10 +65,10 @@ def jsonable_encoder(obj: Any, custom_encoder: Optional[Dict[Any, Callable[[Any]
         return str(obj)
     if isinstance(obj, (str, int, float, type(None))):
         return obj
-    if isinstance(obj, dt.date):
-        return str(obj)
     if isinstance(obj, dt.datetime):
         return serialize_datetime(obj)
+    if isinstance(obj, dt.date):
+        return str(obj)
     if isinstance(obj, dict):
         encoded_dict = {}
         allowed_keys = set(obj.keys())

vellum/core/request_options.py ADDED Viewed

@@ -0,0 +1,32 @@
+# This file was auto-generated by Fern from our API Definition.
+import typing
+try:
+    from typing import NotRequired  # type: ignore
+except ImportError:
+    from typing_extensions import NotRequired  # type: ignore
+class RequestOptions(typing.TypedDict):
+    """
+    Additional options for request-specific configuration when calling APIs via the SDK.
+    This is used primarily as an optional final parameter for service functions.
+    Every key is declared NotRequired, so any subset of them may be supplied.
+    Attributes:
+        - timeout_in_seconds: int. The number of seconds to await an API call before timing out.
+        - max_retries: int. The max number of retries to attempt if the API call fails.
+        - additional_headers: typing.Dict[str, typing.Any]. A dictionary containing additional parameters to spread into the request's header dict
+        - additional_query_parameters: typing.Dict[str, typing.Any]. A dictionary containing additional parameters to spread into the request's query parameters dict
+        - additional_body_parameters: typing.Dict[str, typing.Any]. A dictionary containing additional parameters to spread into the request's body parameters dict
+    """
+    # Per-request timeout, in seconds.
+    timeout_in_seconds: NotRequired[int]
+    # Upper bound on retry attempts for this request.
+    max_retries: NotRequired[int]
+    # Extra entries merged into the request's headers.
+    additional_headers: NotRequired[typing.Dict[str, typing.Any]]
+    # Extra entries merged into the request's query parameters.
+    additional_query_parameters: NotRequired[typing.Dict[str, typing.Any]]
+    # Extra entries merged into the request's body parameters.
+    additional_body_parameters: NotRequired[typing.Dict[str, typing.Any]]

vellum/resources/deployments/client.py CHANGED Viewed

@@ -8,6 +8,7 @@ from ...core.api_error import ApiError
 from ...core.client_wrapper import AsyncClientWrapper, SyncClientWrapper
 from ...core.jsonable_encoder import jsonable_encoder
 from ...core.remove_none_from_dict import remove_none_from_dict
+from ...core.request_options import RequestOptions
 from ...errors.bad_request_error import BadRequestError
 from ...errors.forbidden_error import ForbiddenError
 from ...errors.internal_server_error import InternalServerError
@@ -38,6 +39,7 @@ class DeploymentsClient:
         offset: typing.Optional[int] = None,
         ordering: typing.Optional[str] = None,
         status: typing.Optional[DeploymentsListRequestStatus] = None,
+        request_options: typing.Optional[RequestOptions] = None,
     ) -> PaginatedSlimDeploymentReadList:
         """
         Parameters:
@@ -48,6 +50,8 @@ class DeploymentsClient:
             - ordering: typing.Optional[str]. Which field to use when ordering the results.
             - status: typing.Optional[DeploymentsListRequestStatus]. status
+            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
         ---
         from vellum.client import Vellum
@@ -59,9 +63,34 @@ class DeploymentsClient:
         _response = self._client_wrapper.httpx_client.request(
             "GET",
             urllib.parse.urljoin(f"{self._client_wrapper.get_environment().default}/", "v1/deployments"),
-            params=remove_none_from_dict({"limit": limit, "offset": offset, "ordering": ordering, "status": status}),
-            headers=self._client_wrapper.get_headers(),
-            timeout=None,
+            params=jsonable_encoder(
+                remove_none_from_dict(
+                    {
+                        "limit": limit,
+                        "offset": offset,
+                        "ordering": ordering,
+                        "status": status,
+                        **(
+                            request_options.get("additional_query_parameters", {})
+                            if request_options is not None
+                            else {}
+                        ),
+                    }
+                )
+            ),
+            headers=jsonable_encoder(
+                remove_none_from_dict(
+                    {
+                        **self._client_wrapper.get_headers(),
+                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
+                    }
+                )
+            ),
+            timeout=request_options.get("timeout_in_seconds")
+            if request_options is not None and request_options.get("timeout_in_seconds") is not None
+            else self._client_wrapper.get_timeout(),
+            retries=0,
+            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
         )
         if 200 <= _response.status_code < 300:
             return pydantic.parse_obj_as(PaginatedSlimDeploymentReadList, _response.json())  # type: ignore
@@ -71,12 +100,14 @@ class DeploymentsClient:
             raise ApiError(status_code=_response.status_code, body=_response.text)
         raise ApiError(status_code=_response.status_code, body=_response_json)
-    def retrieve(self, id: str) -> DeploymentRead:
+    def retrieve(self, id: str, *, request_options: typing.Optional[RequestOptions] = None) -> DeploymentRead:
         """
         Used to retrieve a deployment given its ID or name.
         Parameters:
             - id: str. Either the Deployment's ID or its unique name
+            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
         ---
         from vellum.client import Vellum
@@ -89,9 +120,25 @@ class DeploymentsClient:
         """
         _response = self._client_wrapper.httpx_client.request(
             "GET",
-            urllib.parse.urljoin(f"{self._client_wrapper.get_environment().default}/", f"v1/deployments/{id}"),
-            headers=self._client_wrapper.get_headers(),
-            timeout=None,
+            urllib.parse.urljoin(
+                f"{self._client_wrapper.get_environment().default}/", f"v1/deployments/{jsonable_encoder(id)}"
+            ),
+            params=jsonable_encoder(
+                request_options.get("additional_query_parameters") if request_options is not None else None
+            ),
+            headers=jsonable_encoder(
+                remove_none_from_dict(
+                    {
+                        **self._client_wrapper.get_headers(),
+                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
+                    }
+                )
+            ),
+            timeout=request_options.get("timeout_in_seconds")
+            if request_options is not None and request_options.get("timeout_in_seconds") is not None
+            else self._client_wrapper.get_timeout(),
+            retries=0,
+            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
         )
         if 200 <= _response.status_code < 300:
             return pydantic.parse_obj_as(DeploymentRead, _response.json())  # type: ignore
@@ -106,8 +153,9 @@ class DeploymentsClient:
         *,
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        inputs: typing.List[PromptDeploymentInputRequest],
+        inputs: typing.Sequence[PromptDeploymentInputRequest],
         release_tag: typing.Optional[str] = OMIT,
+        request_options: typing.Optional[RequestOptions] = None,
     ) -> DeploymentProviderPayloadResponse:
         """
         Parameters:
@@ -115,9 +163,11 @@ class DeploymentsClient:
             - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
-            - inputs: typing.List[PromptDeploymentInputRequest]. The list of inputs defined in the Prompt's deployment with their corresponding values.
+            - inputs: typing.Sequence[PromptDeploymentInputRequest]. The list of inputs defined in the Prompt's deployment with their corresponding values.
             - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
+            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
         ---
         from vellum.client import Vellum
@@ -140,9 +190,28 @@ class DeploymentsClient:
             urllib.parse.urljoin(
                 f"{self._client_wrapper.get_environment().default}/", "v1/deployments/provider-payload"
             ),
-            json=jsonable_encoder(_request),
-            headers=self._client_wrapper.get_headers(),
-            timeout=None,
+            params=jsonable_encoder(
+                request_options.get("additional_query_parameters") if request_options is not None else None
+            ),
+            json=jsonable_encoder(_request)
+            if request_options is None or request_options.get("additional_body_parameters") is None
+            else {
+                **jsonable_encoder(_request),
+                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            },
+            headers=jsonable_encoder(
+                remove_none_from_dict(
+                    {
+                        **self._client_wrapper.get_headers(),
+                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
+                    }
+                )
+            ),
+            timeout=request_options.get("timeout_in_seconds")
+            if request_options is not None and request_options.get("timeout_in_seconds") is not None
+            else self._client_wrapper.get_timeout(),
+            retries=0,
+            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
         )
         if 200 <= _response.status_code < 300:
             return pydantic.parse_obj_as(DeploymentProviderPayloadResponse, _response.json())  # type: ignore
@@ -172,6 +241,7 @@ class AsyncDeploymentsClient:
         offset: typing.Optional[int] = None,
         ordering: typing.Optional[str] = None,
         status: typing.Optional[DeploymentsListRequestStatus] = None,
+        request_options: typing.Optional[RequestOptions] = None,
     ) -> PaginatedSlimDeploymentReadList:
         """
         Parameters:
@@ -182,6 +252,8 @@ class AsyncDeploymentsClient:
             - ordering: typing.Optional[str]. Which field to use when ordering the results.
             - status: typing.Optional[DeploymentsListRequestStatus]. status
+            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
         ---
         from vellum.client import AsyncVellum
@@ -193,9 +265,34 @@ class AsyncDeploymentsClient:
         _response = await self._client_wrapper.httpx_client.request(
             "GET",
             urllib.parse.urljoin(f"{self._client_wrapper.get_environment().default}/", "v1/deployments"),
-            params=remove_none_from_dict({"limit": limit, "offset": offset, "ordering": ordering, "status": status}),
-            headers=self._client_wrapper.get_headers(),
-            timeout=None,
+            params=jsonable_encoder(
+                remove_none_from_dict(
+                    {
+                        "limit": limit,
+                        "offset": offset,
+                        "ordering": ordering,
+                        "status": status,
+                        **(
+                            request_options.get("additional_query_parameters", {})
+                            if request_options is not None
+                            else {}
+                        ),
+                    }
+                )
+            ),
+            headers=jsonable_encoder(
+                remove_none_from_dict(
+                    {
+                        **self._client_wrapper.get_headers(),
+                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
+                    }
+                )
+            ),
+            timeout=request_options.get("timeout_in_seconds")
+            if request_options is not None and request_options.get("timeout_in_seconds") is not None
+            else self._client_wrapper.get_timeout(),
+            retries=0,
+            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
         )
         if 200 <= _response.status_code < 300:
             return pydantic.parse_obj_as(PaginatedSlimDeploymentReadList, _response.json())  # type: ignore
@@ -205,12 +302,14 @@ class AsyncDeploymentsClient:
             raise ApiError(status_code=_response.status_code, body=_response.text)
         raise ApiError(status_code=_response.status_code, body=_response_json)
-    async def retrieve(self, id: str) -> DeploymentRead:
+    async def retrieve(self, id: str, *, request_options: typing.Optional[RequestOptions] = None) -> DeploymentRead:
         """
         Used to retrieve a deployment given its ID or name.
         Parameters:
             - id: str. Either the Deployment's ID or its unique name
+            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
         ---
         from vellum.client import AsyncVellum
@@ -223,9 +322,25 @@ class AsyncDeploymentsClient:
         """
         _response = await self._client_wrapper.httpx_client.request(
             "GET",
-            urllib.parse.urljoin(f"{self._client_wrapper.get_environment().default}/", f"v1/deployments/{id}"),
-            headers=self._client_wrapper.get_headers(),
-            timeout=None,
+            urllib.parse.urljoin(
+                f"{self._client_wrapper.get_environment().default}/", f"v1/deployments/{jsonable_encoder(id)}"
+            ),
+            params=jsonable_encoder(
+                request_options.get("additional_query_parameters") if request_options is not None else None
+            ),
+            headers=jsonable_encoder(
+                remove_none_from_dict(
+                    {
+                        **self._client_wrapper.get_headers(),
+                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
+                    }
+                )
+            ),
+            timeout=request_options.get("timeout_in_seconds")
+            if request_options is not None and request_options.get("timeout_in_seconds") is not None
+            else self._client_wrapper.get_timeout(),
+            retries=0,
+            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
         )
         if 200 <= _response.status_code < 300:
             return pydantic.parse_obj_as(DeploymentRead, _response.json())  # type: ignore
@@ -240,8 +355,9 @@ class AsyncDeploymentsClient:
         *,
         deployment_id: typing.Optional[str] = OMIT,
         deployment_name: typing.Optional[str] = OMIT,
-        inputs: typing.List[PromptDeploymentInputRequest],
+        inputs: typing.Sequence[PromptDeploymentInputRequest],
         release_tag: typing.Optional[str] = OMIT,
+        request_options: typing.Optional[RequestOptions] = None,
     ) -> DeploymentProviderPayloadResponse:
         """
         Parameters:
@@ -249,9 +365,11 @@ class AsyncDeploymentsClient:
             - deployment_name: typing.Optional[str]. The name of the deployment. Must provide either this or deployment_id.
-            - inputs: typing.List[PromptDeploymentInputRequest]. The list of inputs defined in the Prompt's deployment with their corresponding values.
+            - inputs: typing.Sequence[PromptDeploymentInputRequest]. The list of inputs defined in the Prompt's deployment with their corresponding values.
             - release_tag: typing.Optional[str]. Optionally specify a release tag if you want to pin to a specific release of the Workflow Deployment
+            - request_options: typing.Optional[RequestOptions]. Request-specific configuration.
         ---
         from vellum.client import AsyncVellum
@@ -274,9 +392,28 @@ class AsyncDeploymentsClient:
             urllib.parse.urljoin(
                 f"{self._client_wrapper.get_environment().default}/", "v1/deployments/provider-payload"
             ),
-            json=jsonable_encoder(_request),
-            headers=self._client_wrapper.get_headers(),
-            timeout=None,
+            params=jsonable_encoder(
+                request_options.get("additional_query_parameters") if request_options is not None else None
+            ),
+            json=jsonable_encoder(_request)
+            if request_options is None or request_options.get("additional_body_parameters") is None
+            else {
+                **jsonable_encoder(_request),
+                **(jsonable_encoder(remove_none_from_dict(request_options.get("additional_body_parameters", {})))),
+            },
+            headers=jsonable_encoder(
+                remove_none_from_dict(
+                    {
+                        **self._client_wrapper.get_headers(),
+                        **(request_options.get("additional_headers", {}) if request_options is not None else {}),
+                    }
+                )
+            ),
+            timeout=request_options.get("timeout_in_seconds")
+            if request_options is not None and request_options.get("timeout_in_seconds") is not None
+            else self._client_wrapper.get_timeout(),
+            retries=0,
+            max_retries=request_options.get("max_retries") if request_options is not None else 0,  # type: ignore
         )
         if 200 <= _response.status_code < 300:
             return pydantic.parse_obj_as(DeploymentProviderPayloadResponse, _response.json())  # type: ignore

vellum-ai 0.3.14__py3-none-any.whl → 0.3.15__py3-none-any.whl

vellum-ai 0.3.14__py3-none-any.whl → 0.3.15__py3-none-any.whl