PyPI - orq-ai-sdk - Versions diffs - 4.2.0rc49__py3-none-any.whl → 4.2.15__py3-none-any.whl - Mend

orq-ai-sdk 4.2.0rc49-py3-none-any.whl → 4.2.15-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (104)

orq_ai_sdk/_hooks/globalhook.py +0 -1
orq_ai_sdk/_version.py +3 -3
orq_ai_sdk/agents.py +186 -186
orq_ai_sdk/audio.py +30 -0
orq_ai_sdk/chat.py +22 -0
orq_ai_sdk/completions.py +438 -0
orq_ai_sdk/contacts.py +43 -886
orq_ai_sdk/deployments.py +61 -0
orq_ai_sdk/edits.py +364 -0
orq_ai_sdk/embeddings.py +344 -0
orq_ai_sdk/generations.py +370 -0
orq_ai_sdk/images.py +28 -0
orq_ai_sdk/models/__init__.py +3839 -424
orq_ai_sdk/models/conversationresponse.py +1 -1
orq_ai_sdk/models/conversationwithmessagesresponse.py +1 -1
orq_ai_sdk/models/createagentrequestop.py +768 -12
orq_ai_sdk/models/createagentresponse.py +68 -2
orq_ai_sdk/models/createchatcompletionop.py +538 -313
orq_ai_sdk/models/createcompletionop.py +2078 -0
orq_ai_sdk/models/createcontactop.py +5 -10
orq_ai_sdk/models/createconversationop.py +1 -1
orq_ai_sdk/models/createconversationresponseop.py +2 -2
orq_ai_sdk/models/createdatasetitemop.py +4 -4
orq_ai_sdk/models/createdatasetop.py +1 -1
orq_ai_sdk/models/createdatasourceop.py +1 -1
orq_ai_sdk/models/createembeddingop.py +579 -0
orq_ai_sdk/models/createevalop.py +14 -14
orq_ai_sdk/models/createidentityop.py +1 -1
orq_ai_sdk/models/createimageeditop.py +715 -0
orq_ai_sdk/models/createimageop.py +228 -82
orq_ai_sdk/models/createimagevariationop.py +706 -0
orq_ai_sdk/models/creatememoryop.py +4 -2
orq_ai_sdk/models/createmoderationop.py +521 -0
orq_ai_sdk/models/createpromptop.py +375 -6
orq_ai_sdk/models/creatererankop.py +608 -0
orq_ai_sdk/models/createresponseop.py +2567 -0
orq_ai_sdk/models/createspeechop.py +466 -0
orq_ai_sdk/models/createtoolop.py +6 -6
orq_ai_sdk/models/createtranscriptionop.py +732 -0
orq_ai_sdk/models/createtranslationop.py +702 -0
orq_ai_sdk/models/deploymentgetconfigop.py +17 -7
orq_ai_sdk/models/deploymentsop.py +1 -0
orq_ai_sdk/models/deploymentstreamop.py +7 -0
orq_ai_sdk/models/filegetop.py +1 -1
orq_ai_sdk/models/filelistop.py +1 -1
orq_ai_sdk/models/fileuploadop.py +1 -1
orq_ai_sdk/models/generateconversationnameop.py +1 -1
orq_ai_sdk/models/getallmemoriesop.py +4 -2
orq_ai_sdk/models/getallpromptsop.py +188 -3
orq_ai_sdk/models/getalltoolsop.py +6 -6
orq_ai_sdk/models/getevalsop.py +17 -17
orq_ai_sdk/models/getonepromptop.py +188 -3
orq_ai_sdk/models/getpromptversionop.py +188 -3
orq_ai_sdk/models/invokedeploymentrequest.py +11 -4
orq_ai_sdk/models/listagentsop.py +372 -0
orq_ai_sdk/models/listdatasetdatapointsop.py +4 -4
orq_ai_sdk/models/listdatasetsop.py +1 -1
orq_ai_sdk/models/listdatasourcesop.py +1 -1
orq_ai_sdk/models/listidentitiesop.py +1 -1
orq_ai_sdk/models/listmodelsop.py +1 -0
orq_ai_sdk/models/listpromptversionsop.py +188 -3
orq_ai_sdk/models/partdoneevent.py +1 -1
orq_ai_sdk/models/post_v2_router_ocrop.py +408 -0
orq_ai_sdk/models/publiccontact.py +9 -3
orq_ai_sdk/models/publicidentity.py +62 -0
orq_ai_sdk/models/reasoningpart.py +1 -1
orq_ai_sdk/models/responsedoneevent.py +14 -11
orq_ai_sdk/models/retrieveagentrequestop.py +382 -0
orq_ai_sdk/models/retrievedatapointop.py +4 -4
orq_ai_sdk/models/retrievedatasetop.py +1 -1
orq_ai_sdk/models/retrievedatasourceop.py +1 -1
orq_ai_sdk/models/retrieveidentityop.py +1 -1
orq_ai_sdk/models/retrievememoryop.py +4 -2
orq_ai_sdk/models/retrievetoolop.py +6 -6
orq_ai_sdk/models/runagentop.py +379 -9
orq_ai_sdk/models/streamrunagentop.py +385 -9
orq_ai_sdk/models/updateagentop.py +770 -12
orq_ai_sdk/models/updateconversationop.py +1 -1
orq_ai_sdk/models/updatedatapointop.py +4 -4
orq_ai_sdk/models/updatedatasetop.py +1 -1
orq_ai_sdk/models/updatedatasourceop.py +1 -1
orq_ai_sdk/models/updateevalop.py +14 -14
orq_ai_sdk/models/updateidentityop.py +1 -1
orq_ai_sdk/models/updatememoryop.py +4 -2
orq_ai_sdk/models/updatepromptop.py +375 -6
orq_ai_sdk/models/updatetoolop.py +7 -7
orq_ai_sdk/moderations.py +218 -0
orq_ai_sdk/orq_completions.py +666 -0
orq_ai_sdk/orq_responses.py +398 -0
orq_ai_sdk/rerank.py +330 -0
orq_ai_sdk/router.py +89 -641
orq_ai_sdk/speech.py +333 -0
orq_ai_sdk/transcriptions.py +416 -0
orq_ai_sdk/translations.py +384 -0
orq_ai_sdk/variations.py +364 -0
orq_ai_sdk-4.2.15.dist-info/METADATA +888 -0
{orq_ai_sdk-4.2.0rc49.dist-info → orq_ai_sdk-4.2.15.dist-info}/RECORD +99 -76
{orq_ai_sdk-4.2.0rc49.dist-info → orq_ai_sdk-4.2.15.dist-info}/WHEEL +1 -1
orq_ai_sdk/models/deletecontactop.py +0 -44
orq_ai_sdk/models/listcontactsop.py +0 -265
orq_ai_sdk/models/retrievecontactop.py +0 -142
orq_ai_sdk/models/updatecontactop.py +0 -233
orq_ai_sdk-4.2.0rc49.dist-info/METADATA +0 -788
{orq_ai_sdk-4.2.0rc49.dist-info → orq_ai_sdk-4.2.15.dist-info}/top_level.txt +0 -0

orq_ai_sdk/models/updateagentop.py CHANGED

@@ -382,9 +382,159 @@ class ModelConfigurationGuardrails(BaseModel):
     r"""Determines whether the guardrail runs on the input (user message) or output (model response)."""
+class ModelConfigurationFallbacksTypedDict(TypedDict):
+    model: str
+    r"""Fallback model identifier"""
+class ModelConfigurationFallbacks(BaseModel):
+    model: str
+    r"""Fallback model identifier"""
+class UpdateAgentModelConfigurationRetryTypedDict(TypedDict):
+    r"""Retry configuration for the request"""
+    count: NotRequired[float]
+    r"""Number of retry attempts (1-5)"""
+    on_codes: NotRequired[List[float]]
+    r"""HTTP status codes that trigger retry logic"""
+class UpdateAgentModelConfigurationRetry(BaseModel):
+    r"""Retry configuration for the request"""
+    count: Optional[float] = 3
+    r"""Number of retry attempts (1-5)"""
+    on_codes: Optional[List[float]] = None
+    r"""HTTP status codes that trigger retry logic"""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["count", "on_codes"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+UpdateAgentModelConfigurationType = Literal["exact_match",]
+class ModelConfigurationCacheTypedDict(TypedDict):
+    r"""Cache configuration for the request."""
+    type: UpdateAgentModelConfigurationType
+    ttl: NotRequired[float]
+    r"""Time to live for cached responses in seconds. Maximum 259200 seconds (3 days)."""
+class ModelConfigurationCache(BaseModel):
+    r"""Cache configuration for the request."""
+    type: UpdateAgentModelConfigurationType
+    ttl: Optional[float] = 1800
+    r"""Time to live for cached responses in seconds. Maximum 259200 seconds (3 days)."""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["ttl"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+UpdateAgentLoadBalancerType = Literal["weight_based",]
+class UpdateAgentLoadBalancerModelsTypedDict(TypedDict):
+    model: str
+    r"""Model identifier for load balancing"""
+    weight: NotRequired[float]
+    r"""Weight assigned to this model for load balancing"""
+class UpdateAgentLoadBalancerModels(BaseModel):
+    model: str
+    r"""Model identifier for load balancing"""
+    weight: Optional[float] = 0.5
+    r"""Weight assigned to this model for load balancing"""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["weight"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+class UpdateAgentLoadBalancer1TypedDict(TypedDict):
+    type: UpdateAgentLoadBalancerType
+    models: List[UpdateAgentLoadBalancerModelsTypedDict]
+class UpdateAgentLoadBalancer1(BaseModel):
+    type: UpdateAgentLoadBalancerType
+    models: List[UpdateAgentLoadBalancerModels]
+ModelConfigurationLoadBalancerTypedDict = UpdateAgentLoadBalancer1TypedDict
+r"""Load balancer configuration for the request."""
+ModelConfigurationLoadBalancer = UpdateAgentLoadBalancer1
+r"""Load balancer configuration for the request."""
+class ModelConfigurationTimeoutTypedDict(TypedDict):
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
+    call_timeout: float
+    r"""Timeout value in milliseconds"""
+class ModelConfigurationTimeout(BaseModel):
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
+    call_timeout: float
+    r"""Timeout value in milliseconds"""
 class ModelConfigurationParametersTypedDict(TypedDict):
     r"""Model behavior parameters that control how the model generates responses. Common parameters: `temperature` (0-1, randomness), `max_completion_tokens` (max output length), `top_p` (sampling diversity). Advanced: `frequency_penalty`, `presence_penalty`, `response_format` (JSON/structured), `reasoning_effort`, `seed` (reproducibility). Support varies by model - consult AI Gateway documentation."""
+    name: NotRequired[str]
+    r"""The name to display on the trace. If not specified, the default system name will be used."""
     audio: NotRequired[Nullable[UpdateAgentModelConfigurationAudioTypedDict]]
     r"""Parameters for audio output. Required when audio output is requested with modalities: [\"audio\"]. Learn more."""
     frequency_penalty: NotRequired[Nullable[float]]
@@ -439,11 +589,24 @@ class ModelConfigurationParametersTypedDict(TypedDict):
     r"""Output types that you would like the model to generate. Most models are capable of generating text, which is the default: [\"text\"]. The gpt-4o-audio-preview model can also be used to generate audio. To request that this model generate both text and audio responses, you can use: [\"text\", \"audio\"]."""
     guardrails: NotRequired[List[ModelConfigurationGuardrailsTypedDict]]
     r"""A list of guardrails to apply to the request."""
+    fallbacks: NotRequired[List[ModelConfigurationFallbacksTypedDict]]
+    r"""Array of fallback models to use if primary model fails"""
+    retry: NotRequired[UpdateAgentModelConfigurationRetryTypedDict]
+    r"""Retry configuration for the request"""
+    cache: NotRequired[ModelConfigurationCacheTypedDict]
+    r"""Cache configuration for the request."""
+    load_balancer: NotRequired[ModelConfigurationLoadBalancerTypedDict]
+    r"""Load balancer configuration for the request."""
+    timeout: NotRequired[ModelConfigurationTimeoutTypedDict]
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
 class ModelConfigurationParameters(BaseModel):
     r"""Model behavior parameters that control how the model generates responses. Common parameters: `temperature` (0-1, randomness), `max_completion_tokens` (max output length), `top_p` (sampling diversity). Advanced: `frequency_penalty`, `presence_penalty`, `response_format` (JSON/structured), `reasoning_effort`, `seed` (reproducibility). Support varies by model - consult AI Gateway documentation."""
+    name: Optional[str] = None
+    r"""The name to display on the trace. If not specified, the default system name will be used."""
     audio: OptionalNullable[UpdateAgentModelConfigurationAudio] = UNSET
     r"""Parameters for audio output. Required when audio output is requested with modalities: [\"audio\"]. Learn more."""
@@ -520,10 +683,26 @@ class ModelConfigurationParameters(BaseModel):
     guardrails: Optional[List[ModelConfigurationGuardrails]] = None
     r"""A list of guardrails to apply to the request."""
+    fallbacks: Optional[List[ModelConfigurationFallbacks]] = None
+    r"""Array of fallback models to use if primary model fails"""
+    retry: Optional[UpdateAgentModelConfigurationRetry] = None
+    r"""Retry configuration for the request"""
+    cache: Optional[ModelConfigurationCache] = None
+    r"""Cache configuration for the request."""
+    load_balancer: Optional[ModelConfigurationLoadBalancer] = None
+    r"""Load balancer configuration for the request."""
+    timeout: Optional[ModelConfigurationTimeout] = None
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
     @model_serializer(mode="wrap")
     def serialize_model(self, handler):
         optional_fields = set(
             [
+                "name",
                 "audio",
                 "frequency_penalty",
                 "max_tokens",
@@ -546,6 +725,11 @@ class ModelConfigurationParameters(BaseModel):
                 "parallel_tool_calls",
                 "modalities",
                 "guardrails",
+                "fallbacks",
+                "retry",
+                "cache",
+                "load_balancer",
+                "timeout",
             ]
         )
         nullable_fields = set(
@@ -589,7 +773,7 @@ class ModelConfigurationParameters(BaseModel):
         return m
-class ModelConfigurationRetryTypedDict(TypedDict):
+class UpdateAgentModelConfigurationAgentsRetryTypedDict(TypedDict):
     r"""Retry configuration for model requests. Retries are triggered for specific HTTP status codes (e.g., 500, 429, 502, 503, 504). Supports configurable retry count (1-5) and custom status codes."""
     count: NotRequired[float]
@@ -598,7 +782,7 @@ class ModelConfigurationRetryTypedDict(TypedDict):
     r"""HTTP status codes that trigger retry logic"""
-class ModelConfigurationRetry(BaseModel):
+class UpdateAgentModelConfigurationAgentsRetry(BaseModel):
     r"""Retry configuration for model requests. Retries are triggered for specific HTTP status codes (e.g., 500, 429, 502, 503, 504). Supports configurable retry count (1-5) and custom status codes."""
     count: Optional[float] = 3
@@ -634,7 +818,7 @@ class UpdateAgentModelConfiguration2TypedDict(TypedDict):
     r"""A model ID string (e.g., `openai/gpt-4o` or `anthropic/claude-haiku-4-5-20251001`). Only models that support tool calling can be used with agents."""
     parameters: NotRequired[ModelConfigurationParametersTypedDict]
     r"""Model behavior parameters that control how the model generates responses. Common parameters: `temperature` (0-1, randomness), `max_completion_tokens` (max output length), `top_p` (sampling diversity). Advanced: `frequency_penalty`, `presence_penalty`, `response_format` (JSON/structured), `reasoning_effort`, `seed` (reproducibility). Support varies by model - consult AI Gateway documentation."""
-    retry: NotRequired[ModelConfigurationRetryTypedDict]
+    retry: NotRequired[UpdateAgentModelConfigurationAgentsRetryTypedDict]
     r"""Retry configuration for model requests. Retries are triggered for specific HTTP status codes (e.g., 500, 429, 502, 503, 504). Supports configurable retry count (1-5) and custom status codes."""
@@ -650,7 +834,7 @@ class UpdateAgentModelConfiguration2(BaseModel):
     parameters: Optional[ModelConfigurationParameters] = None
     r"""Model behavior parameters that control how the model generates responses. Common parameters: `temperature` (0-1, randomness), `max_completion_tokens` (max output length), `top_p` (sampling diversity). Advanced: `frequency_penalty`, `presence_penalty`, `response_format` (JSON/structured), `reasoning_effort`, `seed` (reproducibility). Support varies by model - consult AI Gateway documentation."""
-    retry: Optional[ModelConfigurationRetry] = None
+    retry: Optional[UpdateAgentModelConfigurationAgentsRetry] = None
     r"""Retry configuration for model requests. Retries are triggered for specific HTTP status codes (e.g., 500, 429, 502, 503, 504). Supports configurable retry count (1-5) and custom status codes."""
     @model_serializer(mode="wrap")
@@ -1042,9 +1226,161 @@ class UpdateAgentFallbackModelConfigurationGuardrails(BaseModel):
     r"""Determines whether the guardrail runs on the input (user message) or output (model response)."""
+class UpdateAgentFallbackModelConfigurationFallbacksTypedDict(TypedDict):
+    model: str
+    r"""Fallback model identifier"""
+class UpdateAgentFallbackModelConfigurationFallbacks(BaseModel):
+    model: str
+    r"""Fallback model identifier"""
+class UpdateAgentFallbackModelConfigurationRetryTypedDict(TypedDict):
+    r"""Retry configuration for the request"""
+    count: NotRequired[float]
+    r"""Number of retry attempts (1-5)"""
+    on_codes: NotRequired[List[float]]
+    r"""HTTP status codes that trigger retry logic"""
+class UpdateAgentFallbackModelConfigurationRetry(BaseModel):
+    r"""Retry configuration for the request"""
+    count: Optional[float] = 3
+    r"""Number of retry attempts (1-5)"""
+    on_codes: Optional[List[float]] = None
+    r"""HTTP status codes that trigger retry logic"""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["count", "on_codes"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+UpdateAgentFallbackModelConfigurationType = Literal["exact_match",]
+class UpdateAgentFallbackModelConfigurationCacheTypedDict(TypedDict):
+    r"""Cache configuration for the request."""
+    type: UpdateAgentFallbackModelConfigurationType
+    ttl: NotRequired[float]
+    r"""Time to live for cached responses in seconds. Maximum 259200 seconds (3 days)."""
+class UpdateAgentFallbackModelConfigurationCache(BaseModel):
+    r"""Cache configuration for the request."""
+    type: UpdateAgentFallbackModelConfigurationType
+    ttl: Optional[float] = 1800
+    r"""Time to live for cached responses in seconds. Maximum 259200 seconds (3 days)."""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["ttl"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+UpdateAgentLoadBalancerAgentsType = Literal["weight_based",]
+class UpdateAgentLoadBalancerAgentsModelsTypedDict(TypedDict):
+    model: str
+    r"""Model identifier for load balancing"""
+    weight: NotRequired[float]
+    r"""Weight assigned to this model for load balancing"""
+class UpdateAgentLoadBalancerAgentsModels(BaseModel):
+    model: str
+    r"""Model identifier for load balancing"""
+    weight: Optional[float] = 0.5
+    r"""Weight assigned to this model for load balancing"""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["weight"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+class UpdateAgentLoadBalancerAgents1TypedDict(TypedDict):
+    type: UpdateAgentLoadBalancerAgentsType
+    models: List[UpdateAgentLoadBalancerAgentsModelsTypedDict]
+class UpdateAgentLoadBalancerAgents1(BaseModel):
+    type: UpdateAgentLoadBalancerAgentsType
+    models: List[UpdateAgentLoadBalancerAgentsModels]
+UpdateAgentFallbackModelConfigurationLoadBalancerTypedDict = (
+    UpdateAgentLoadBalancerAgents1TypedDict
+)
+r"""Load balancer configuration for the request."""
+UpdateAgentFallbackModelConfigurationLoadBalancer = UpdateAgentLoadBalancerAgents1
+r"""Load balancer configuration for the request."""
+class UpdateAgentFallbackModelConfigurationTimeoutTypedDict(TypedDict):
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
+    call_timeout: float
+    r"""Timeout value in milliseconds"""
+class UpdateAgentFallbackModelConfigurationTimeout(BaseModel):
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
+    call_timeout: float
+    r"""Timeout value in milliseconds"""
 class UpdateAgentFallbackModelConfigurationParametersTypedDict(TypedDict):
     r"""Optional model parameters specific to this fallback model. Overrides primary model parameters if this fallback is used."""
+    name: NotRequired[str]
+    r"""The name to display on the trace. If not specified, the default system name will be used."""
     audio: NotRequired[Nullable[UpdateAgentFallbackModelConfigurationAudioTypedDict]]
     r"""Parameters for audio output. Required when audio output is requested with modalities: [\"audio\"]. Learn more."""
     frequency_penalty: NotRequired[Nullable[float]]
@@ -1107,11 +1443,28 @@ class UpdateAgentFallbackModelConfigurationParametersTypedDict(TypedDict):
         List[UpdateAgentFallbackModelConfigurationGuardrailsTypedDict]
     ]
     r"""A list of guardrails to apply to the request."""
+    fallbacks: NotRequired[
+        List[UpdateAgentFallbackModelConfigurationFallbacksTypedDict]
+    ]
+    r"""Array of fallback models to use if primary model fails"""
+    retry: NotRequired[UpdateAgentFallbackModelConfigurationRetryTypedDict]
+    r"""Retry configuration for the request"""
+    cache: NotRequired[UpdateAgentFallbackModelConfigurationCacheTypedDict]
+    r"""Cache configuration for the request."""
+    load_balancer: NotRequired[
+        UpdateAgentFallbackModelConfigurationLoadBalancerTypedDict
+    ]
+    r"""Load balancer configuration for the request."""
+    timeout: NotRequired[UpdateAgentFallbackModelConfigurationTimeoutTypedDict]
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
 class UpdateAgentFallbackModelConfigurationParameters(BaseModel):
     r"""Optional model parameters specific to this fallback model. Overrides primary model parameters if this fallback is used."""
+    name: Optional[str] = None
+    r"""The name to display on the trace. If not specified, the default system name will be used."""
     audio: OptionalNullable[UpdateAgentFallbackModelConfigurationAudio] = UNSET
     r"""Parameters for audio output. Required when audio output is requested with modalities: [\"audio\"]. Learn more."""
@@ -1196,10 +1549,26 @@ class UpdateAgentFallbackModelConfigurationParameters(BaseModel):
     guardrails: Optional[List[UpdateAgentFallbackModelConfigurationGuardrails]] = None
     r"""A list of guardrails to apply to the request."""
+    fallbacks: Optional[List[UpdateAgentFallbackModelConfigurationFallbacks]] = None
+    r"""Array of fallback models to use if primary model fails"""
+    retry: Optional[UpdateAgentFallbackModelConfigurationRetry] = None
+    r"""Retry configuration for the request"""
+    cache: Optional[UpdateAgentFallbackModelConfigurationCache] = None
+    r"""Cache configuration for the request."""
+    load_balancer: Optional[UpdateAgentFallbackModelConfigurationLoadBalancer] = None
+    r"""Load balancer configuration for the request."""
+    timeout: Optional[UpdateAgentFallbackModelConfigurationTimeout] = None
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
     @model_serializer(mode="wrap")
     def serialize_model(self, handler):
         optional_fields = set(
             [
+                "name",
                 "audio",
                 "frequency_penalty",
                 "max_tokens",
@@ -1222,6 +1591,11 @@ class UpdateAgentFallbackModelConfigurationParameters(BaseModel):
                 "parallel_tool_calls",
                 "modalities",
                 "guardrails",
+                "fallbacks",
+                "retry",
+                "cache",
+                "load_balancer",
+                "timeout",
             ]
         )
         nullable_fields = set(
@@ -1265,7 +1639,7 @@ class UpdateAgentFallbackModelConfigurationParameters(BaseModel):
         return m
-class UpdateAgentFallbackModelConfigurationRetryTypedDict(TypedDict):
+class UpdateAgentFallbackModelConfigurationAgentsRetryTypedDict(TypedDict):
     r"""Retry configuration for this fallback model. Allows customizing retry count (1-5) and HTTP status codes that trigger retries."""
     count: NotRequired[float]
@@ -1274,7 +1648,7 @@ class UpdateAgentFallbackModelConfigurationRetryTypedDict(TypedDict):
     r"""HTTP status codes that trigger retry logic"""
-class UpdateAgentFallbackModelConfigurationRetry(BaseModel):
+class UpdateAgentFallbackModelConfigurationAgentsRetry(BaseModel):
     r"""Retry configuration for this fallback model. Allows customizing retry count (1-5) and HTTP status codes that trigger retries."""
     count: Optional[float] = 3
@@ -1307,7 +1681,7 @@ class UpdateAgentFallbackModelConfiguration2TypedDict(TypedDict):
     r"""A fallback model ID string. Must support tool calling."""
     parameters: NotRequired[UpdateAgentFallbackModelConfigurationParametersTypedDict]
     r"""Optional model parameters specific to this fallback model. Overrides primary model parameters if this fallback is used."""
-    retry: NotRequired[UpdateAgentFallbackModelConfigurationRetryTypedDict]
+    retry: NotRequired[UpdateAgentFallbackModelConfigurationAgentsRetryTypedDict]
     r"""Retry configuration for this fallback model. Allows customizing retry count (1-5) and HTTP status codes that trigger retries."""
@@ -1320,7 +1694,7 @@ class UpdateAgentFallbackModelConfiguration2(BaseModel):
     parameters: Optional[UpdateAgentFallbackModelConfigurationParameters] = None
     r"""Optional model parameters specific to this fallback model. Overrides primary model parameters if this fallback is used."""
-    retry: Optional[UpdateAgentFallbackModelConfigurationRetry] = None
+    retry: Optional[UpdateAgentFallbackModelConfigurationAgentsRetry] = None
     r"""Retry configuration for this fallback model. Allows customizing retry count (1-5) and HTTP status codes that trigger retries."""
     @model_serializer(mode="wrap")
@@ -3048,9 +3422,159 @@ class UpdateAgentAgentsResponseGuardrails(BaseModel):
     r"""Determines whether the guardrail runs on the input (user message) or output (model response)."""
+class UpdateAgentFallbacksTypedDict(TypedDict):
+    model: str
+    r"""Fallback model identifier"""
+class UpdateAgentFallbacks(BaseModel):
+    model: str
+    r"""Fallback model identifier"""
+class UpdateAgentAgentsRetryTypedDict(TypedDict):
+    r"""Retry configuration for the request"""
+    count: NotRequired[float]
+    r"""Number of retry attempts (1-5)"""
+    on_codes: NotRequired[List[float]]
+    r"""HTTP status codes that trigger retry logic"""
+class UpdateAgentAgentsRetry(BaseModel):
+    r"""Retry configuration for the request"""
+    count: Optional[float] = 3
+    r"""Number of retry attempts (1-5)"""
+    on_codes: Optional[List[float]] = None
+    r"""HTTP status codes that trigger retry logic"""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["count", "on_codes"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+UpdateAgentType = Literal["exact_match",]
+class UpdateAgentCacheTypedDict(TypedDict):
+    r"""Cache configuration for the request."""
+    type: UpdateAgentType
+    ttl: NotRequired[float]
+    r"""Time to live for cached responses in seconds. Maximum 259200 seconds (3 days)."""
+class UpdateAgentCache(BaseModel):
+    r"""Cache configuration for the request."""
+    type: UpdateAgentType
+    ttl: Optional[float] = 1800
+    r"""Time to live for cached responses in seconds. Maximum 259200 seconds (3 days)."""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["ttl"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+UpdateAgentLoadBalancerAgentsResponseType = Literal["weight_based",]
+class UpdateAgentLoadBalancerAgentsResponseModelsTypedDict(TypedDict):
+    model: str
+    r"""Model identifier for load balancing"""
+    weight: NotRequired[float]
+    r"""Weight assigned to this model for load balancing"""
+class UpdateAgentLoadBalancerAgentsResponseModels(BaseModel):
+    model: str
+    r"""Model identifier for load balancing"""
+    weight: Optional[float] = 0.5
+    r"""Weight assigned to this model for load balancing"""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["weight"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+class UpdateAgentLoadBalancerAgentsResponse1TypedDict(TypedDict):
+    type: UpdateAgentLoadBalancerAgentsResponseType
+    models: List[UpdateAgentLoadBalancerAgentsResponseModelsTypedDict]
+class UpdateAgentLoadBalancerAgentsResponse1(BaseModel):
+    type: UpdateAgentLoadBalancerAgentsResponseType
+    models: List[UpdateAgentLoadBalancerAgentsResponseModels]
+UpdateAgentLoadBalancerTypedDict = UpdateAgentLoadBalancerAgentsResponse1TypedDict
+r"""Load balancer configuration for the request."""
+UpdateAgentLoadBalancer = UpdateAgentLoadBalancerAgentsResponse1
+r"""Load balancer configuration for the request."""
+class UpdateAgentTimeoutTypedDict(TypedDict):
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
+    call_timeout: float
+    r"""Timeout value in milliseconds"""
+class UpdateAgentTimeout(BaseModel):
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
+    call_timeout: float
+    r"""Timeout value in milliseconds"""
 class UpdateAgentParametersTypedDict(TypedDict):
     r"""Model behavior parameters (snake_case) stored as part of the agent configuration. These become the default parameters used when the agent is executed. Commonly used: temperature (0-1, controls randomness), max_completion_tokens (response length), top_p (nucleus sampling). Advanced: frequency_penalty, presence_penalty, response_format (JSON/structured output), reasoning_effort (for o1/thinking models), seed (reproducibility), stop sequences. Model-specific support varies. Runtime parameters in agent execution requests can override these defaults."""
+    name: NotRequired[str]
+    r"""The name to display on the trace. If not specified, the default system name will be used."""
     audio: NotRequired[Nullable[UpdateAgentAudioTypedDict]]
     r"""Parameters for audio output. Required when audio output is requested with modalities: [\"audio\"]. Learn more."""
     frequency_penalty: NotRequired[Nullable[float]]
@@ -3105,11 +3629,24 @@ class UpdateAgentParametersTypedDict(TypedDict):
     r"""Output types that you would like the model to generate. Most models are capable of generating text, which is the default: [\"text\"]. The gpt-4o-audio-preview model can also be used to generate audio. To request that this model generate both text and audio responses, you can use: [\"text\", \"audio\"]."""
     guardrails: NotRequired[List[UpdateAgentAgentsResponseGuardrailsTypedDict]]
     r"""A list of guardrails to apply to the request."""
+    fallbacks: NotRequired[List[UpdateAgentFallbacksTypedDict]]
+    r"""Array of fallback models to use if primary model fails"""
+    retry: NotRequired[UpdateAgentAgentsRetryTypedDict]
+    r"""Retry configuration for the request"""
+    cache: NotRequired[UpdateAgentCacheTypedDict]
+    r"""Cache configuration for the request."""
+    load_balancer: NotRequired[UpdateAgentLoadBalancerTypedDict]
+    r"""Load balancer configuration for the request."""
+    timeout: NotRequired[UpdateAgentTimeoutTypedDict]
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
 class UpdateAgentParameters(BaseModel):
     r"""Model behavior parameters (snake_case) stored as part of the agent configuration. These become the default parameters used when the agent is executed. Commonly used: temperature (0-1, controls randomness), max_completion_tokens (response length), top_p (nucleus sampling). Advanced: frequency_penalty, presence_penalty, response_format (JSON/structured output), reasoning_effort (for o1/thinking models), seed (reproducibility), stop sequences. Model-specific support varies. Runtime parameters in agent execution requests can override these defaults."""
+    name: Optional[str] = None
+    r"""The name to display on the trace. If not specified, the default system name will be used."""
     audio: OptionalNullable[UpdateAgentAudio] = UNSET
     r"""Parameters for audio output. Required when audio output is requested with modalities: [\"audio\"]. Learn more."""
@@ -3186,10 +3723,26 @@ class UpdateAgentParameters(BaseModel):
     guardrails: Optional[List[UpdateAgentAgentsResponseGuardrails]] = None
     r"""A list of guardrails to apply to the request."""
+    fallbacks: Optional[List[UpdateAgentFallbacks]] = None
+    r"""Array of fallback models to use if primary model fails"""
+    retry: Optional[UpdateAgentAgentsRetry] = None
+    r"""Retry configuration for the request"""
+    cache: Optional[UpdateAgentCache] = None
+    r"""Cache configuration for the request."""
+    load_balancer: Optional[UpdateAgentLoadBalancer] = None
+    r"""Load balancer configuration for the request."""
+    timeout: Optional[UpdateAgentTimeout] = None
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
     @model_serializer(mode="wrap")
     def serialize_model(self, handler):
         optional_fields = set(
             [
+                "name",
                 "audio",
                 "frequency_penalty",
                 "max_tokens",
@@ -3212,6 +3765,11 @@ class UpdateAgentParameters(BaseModel):
                 "parallel_tool_calls",
                 "modalities",
                 "guardrails",
+                "fallbacks",
+                "retry",
+                "cache",
+                "load_balancer",
+                "timeout",
             ]
         )
         nullable_fields = set(
@@ -3672,9 +4230,163 @@ class UpdateAgentFallbackModelConfigurationAgentsGuardrails(BaseModel):
     r"""Determines whether the guardrail runs on the input (user message) or output (model response)."""
+class UpdateAgentFallbackModelConfigurationAgentsFallbacksTypedDict(TypedDict):
+    model: str
+    r"""Fallback model identifier"""
+class UpdateAgentFallbackModelConfigurationAgentsFallbacks(BaseModel):
+    model: str
+    r"""Fallback model identifier"""
+class UpdateAgentFallbackModelConfigurationAgentsResponse200RetryTypedDict(TypedDict):
+    r"""Retry configuration for the request"""
+    count: NotRequired[float]
+    r"""Number of retry attempts (1-5)"""
+    on_codes: NotRequired[List[float]]
+    r"""HTTP status codes that trigger retry logic"""
+class UpdateAgentFallbackModelConfigurationAgentsResponse200Retry(BaseModel):
+    r"""Retry configuration for the request"""
+    count: Optional[float] = 3
+    r"""Number of retry attempts (1-5)"""
+    on_codes: Optional[List[float]] = None
+    r"""HTTP status codes that trigger retry logic"""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["count", "on_codes"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+UpdateAgentFallbackModelConfigurationAgentsType = Literal["exact_match",]
+class UpdateAgentFallbackModelConfigurationAgentsCacheTypedDict(TypedDict):
+    r"""Cache configuration for the request."""
+    type: UpdateAgentFallbackModelConfigurationAgentsType
+    ttl: NotRequired[float]
+    r"""Time to live for cached responses in seconds. Maximum 259200 seconds (3 days)."""
+class UpdateAgentFallbackModelConfigurationAgentsCache(BaseModel):
+    r"""Cache configuration for the request."""
+    type: UpdateAgentFallbackModelConfigurationAgentsType
+    ttl: Optional[float] = 1800
+    r"""Time to live for cached responses in seconds. Maximum 259200 seconds (3 days)."""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["ttl"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+UpdateAgentLoadBalancerAgentsResponse200Type = Literal["weight_based",]
+class UpdateAgentLoadBalancerAgentsResponse200ModelsTypedDict(TypedDict):
+    model: str
+    r"""Model identifier for load balancing"""
+    weight: NotRequired[float]
+    r"""Weight assigned to this model for load balancing"""
+class UpdateAgentLoadBalancerAgentsResponse200Models(BaseModel):
+    model: str
+    r"""Model identifier for load balancing"""
+    weight: Optional[float] = 0.5
+    r"""Weight assigned to this model for load balancing"""
+    @model_serializer(mode="wrap")
+    def serialize_model(self, handler):
+        optional_fields = set(["weight"])
+        serialized = handler(self)
+        m = {}
+        for n, f in type(self).model_fields.items():
+            k = f.alias or n
+            val = serialized.get(k)
+            if val != UNSET_SENTINEL:
+                if val is not None or k not in optional_fields:
+                    m[k] = val
+        return m
+class UpdateAgentLoadBalancerAgentsResponse2001TypedDict(TypedDict):
+    type: UpdateAgentLoadBalancerAgentsResponse200Type
+    models: List[UpdateAgentLoadBalancerAgentsResponse200ModelsTypedDict]
+class UpdateAgentLoadBalancerAgentsResponse2001(BaseModel):
+    type: UpdateAgentLoadBalancerAgentsResponse200Type
+    models: List[UpdateAgentLoadBalancerAgentsResponse200Models]
+UpdateAgentFallbackModelConfigurationAgentsLoadBalancerTypedDict = (
+    UpdateAgentLoadBalancerAgentsResponse2001TypedDict
+)
+r"""Load balancer configuration for the request."""
+UpdateAgentFallbackModelConfigurationAgentsLoadBalancer = (
+    UpdateAgentLoadBalancerAgentsResponse2001
+)
+r"""Load balancer configuration for the request."""
+class UpdateAgentFallbackModelConfigurationAgentsTimeoutTypedDict(TypedDict):
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
+    call_timeout: float
+    r"""Timeout value in milliseconds"""
+class UpdateAgentFallbackModelConfigurationAgentsTimeout(BaseModel):
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
+    call_timeout: float
+    r"""Timeout value in milliseconds"""
 class UpdateAgentFallbackModelConfigurationAgentsParametersTypedDict(TypedDict):
     r"""Optional model parameters specific to this fallback model. Overrides primary model parameters if this fallback is used."""
+    name: NotRequired[str]
+    r"""The name to display on the trace. If not specified, the default system name will be used."""
     audio: NotRequired[
         Nullable[UpdateAgentFallbackModelConfigurationAgentsAudioTypedDict]
     ]
@@ -3745,11 +4457,30 @@ class UpdateAgentFallbackModelConfigurationAgentsParametersTypedDict(TypedDict):
         List[UpdateAgentFallbackModelConfigurationAgentsGuardrailsTypedDict]
     ]
     r"""A list of guardrails to apply to the request."""
+    fallbacks: NotRequired[
+        List[UpdateAgentFallbackModelConfigurationAgentsFallbacksTypedDict]
+    ]
+    r"""Array of fallback models to use if primary model fails"""
+    retry: NotRequired[
+        UpdateAgentFallbackModelConfigurationAgentsResponse200RetryTypedDict
+    ]
+    r"""Retry configuration for the request"""
+    cache: NotRequired[UpdateAgentFallbackModelConfigurationAgentsCacheTypedDict]
+    r"""Cache configuration for the request."""
+    load_balancer: NotRequired[
+        UpdateAgentFallbackModelConfigurationAgentsLoadBalancerTypedDict
+    ]
+    r"""Load balancer configuration for the request."""
+    timeout: NotRequired[UpdateAgentFallbackModelConfigurationAgentsTimeoutTypedDict]
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
 class UpdateAgentFallbackModelConfigurationAgentsParameters(BaseModel):
     r"""Optional model parameters specific to this fallback model. Overrides primary model parameters if this fallback is used."""
+    name: Optional[str] = None
+    r"""The name to display on the trace. If not specified, the default system name will be used."""
     audio: OptionalNullable[UpdateAgentFallbackModelConfigurationAgentsAudio] = UNSET
     r"""Parameters for audio output. Required when audio output is requested with modalities: [\"audio\"]. Learn more."""
@@ -3836,10 +4567,30 @@ class UpdateAgentFallbackModelConfigurationAgentsParameters(BaseModel):
     ] = None
     r"""A list of guardrails to apply to the request."""
+    fallbacks: Optional[List[UpdateAgentFallbackModelConfigurationAgentsFallbacks]] = (
+        None
+    )
+    r"""Array of fallback models to use if primary model fails"""
+    retry: Optional[UpdateAgentFallbackModelConfigurationAgentsResponse200Retry] = None
+    r"""Retry configuration for the request"""
+    cache: Optional[UpdateAgentFallbackModelConfigurationAgentsCache] = None
+    r"""Cache configuration for the request."""
+    load_balancer: Optional[UpdateAgentFallbackModelConfigurationAgentsLoadBalancer] = (
+        None
+    )
+    r"""Load balancer configuration for the request."""
+    timeout: Optional[UpdateAgentFallbackModelConfigurationAgentsTimeout] = None
+    r"""Timeout configuration to apply to the request. If the request exceeds the timeout, it will be retried or fallback to the next model if configured."""
     @model_serializer(mode="wrap")
     def serialize_model(self, handler):
         optional_fields = set(
             [
+                "name",
                 "audio",
                 "frequency_penalty",
                 "max_tokens",
@@ -3862,6 +4613,11 @@ class UpdateAgentFallbackModelConfigurationAgentsParameters(BaseModel):
                 "parallel_tool_calls",
                 "modalities",
                 "guardrails",
+                "fallbacks",
+                "retry",
+                "cache",
+                "load_balancer",
+                "timeout",
             ]
         )
         nullable_fields = set(
@@ -3905,7 +4661,7 @@ class UpdateAgentFallbackModelConfigurationAgentsParameters(BaseModel):
         return m
-class UpdateAgentFallbackModelConfigurationAgentsRetryTypedDict(TypedDict):
+class UpdateAgentFallbackModelConfigurationAgentsResponseRetryTypedDict(TypedDict):
     r"""Retry configuration for this fallback model. Allows customizing retry count (1-5) and HTTP status codes that trigger retries."""
     count: NotRequired[float]
@@ -3914,7 +4670,7 @@ class UpdateAgentFallbackModelConfigurationAgentsRetryTypedDict(TypedDict):
     r"""HTTP status codes that trigger retry logic"""
-class UpdateAgentFallbackModelConfigurationAgentsRetry(BaseModel):
+class UpdateAgentFallbackModelConfigurationAgentsResponseRetry(BaseModel):
     r"""Retry configuration for this fallback model. Allows customizing retry count (1-5) and HTTP status codes that trigger retries."""
     count: Optional[float] = 3
@@ -3949,7 +4705,9 @@ class UpdateAgentFallbackModelConfigurationAgents2TypedDict(TypedDict):
         UpdateAgentFallbackModelConfigurationAgentsParametersTypedDict
     ]
     r"""Optional model parameters specific to this fallback model. Overrides primary model parameters if this fallback is used."""
-    retry: NotRequired[UpdateAgentFallbackModelConfigurationAgentsRetryTypedDict]
+    retry: NotRequired[
+        UpdateAgentFallbackModelConfigurationAgentsResponseRetryTypedDict
+    ]
     r"""Retry configuration for this fallback model. Allows customizing retry count (1-5) and HTTP status codes that trigger retries."""
@@ -3962,7 +4720,7 @@ class UpdateAgentFallbackModelConfigurationAgents2(BaseModel):
     parameters: Optional[UpdateAgentFallbackModelConfigurationAgentsParameters] = None
     r"""Optional model parameters specific to this fallback model. Overrides primary model parameters if this fallback is used."""
-    retry: Optional[UpdateAgentFallbackModelConfigurationAgentsRetry] = None
+    retry: Optional[UpdateAgentFallbackModelConfigurationAgentsResponseRetry] = None
     r"""Retry configuration for this fallback model. Allows customizing retry count (1-5) and HTTP status codes that trigger retries."""
     @model_serializer(mode="wrap")

orq-ai-sdk 4.2.0rc49__py3-none-any.whl → 4.2.15__py3-none-any.whl

orq-ai-sdk 4.2.0rc49__py3-none-any.whl → 4.2.15__py3-none-any.whl