ag2 0.9.7__py3-none-any.whl → 0.9.9__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release. This version of ag2 might be problematic.
- {ag2-0.9.7.dist-info → ag2-0.9.9.dist-info}/METADATA +102 -75
- ag2-0.9.9.dist-info/RECORD +387 -0
- autogen/__init__.py +1 -2
- autogen/_website/generate_api_references.py +4 -5
- autogen/_website/generate_mkdocs.py +9 -15
- autogen/_website/notebook_processor.py +13 -14
- autogen/_website/process_notebooks.py +10 -10
- autogen/_website/utils.py +5 -4
- autogen/agentchat/agent.py +13 -13
- autogen/agentchat/assistant_agent.py +7 -6
- autogen/agentchat/contrib/agent_eval/agent_eval.py +3 -3
- autogen/agentchat/contrib/agent_eval/critic_agent.py +3 -3
- autogen/agentchat/contrib/agent_eval/quantifier_agent.py +3 -3
- autogen/agentchat/contrib/agent_eval/subcritic_agent.py +3 -3
- autogen/agentchat/contrib/agent_optimizer.py +3 -3
- autogen/agentchat/contrib/capabilities/generate_images.py +11 -11
- autogen/agentchat/contrib/capabilities/teachability.py +15 -15
- autogen/agentchat/contrib/capabilities/transforms.py +17 -18
- autogen/agentchat/contrib/capabilities/transforms_util.py +5 -5
- autogen/agentchat/contrib/capabilities/vision_capability.py +4 -3
- autogen/agentchat/contrib/captainagent/agent_builder.py +30 -30
- autogen/agentchat/contrib/captainagent/captainagent.py +22 -21
- autogen/agentchat/contrib/captainagent/tool_retriever.py +2 -3
- autogen/agentchat/contrib/gpt_assistant_agent.py +9 -9
- autogen/agentchat/contrib/graph_rag/document.py +3 -3
- autogen/agentchat/contrib/graph_rag/falkor_graph_query_engine.py +3 -3
- autogen/agentchat/contrib/graph_rag/falkor_graph_rag_capability.py +6 -6
- autogen/agentchat/contrib/graph_rag/graph_query_engine.py +3 -3
- autogen/agentchat/contrib/graph_rag/neo4j_graph_query_engine.py +5 -11
- autogen/agentchat/contrib/graph_rag/neo4j_graph_rag_capability.py +6 -6
- autogen/agentchat/contrib/graph_rag/neo4j_native_graph_query_engine.py +7 -7
- autogen/agentchat/contrib/graph_rag/neo4j_native_graph_rag_capability.py +6 -6
- autogen/agentchat/contrib/img_utils.py +1 -1
- autogen/agentchat/contrib/llamaindex_conversable_agent.py +11 -11
- autogen/agentchat/contrib/llava_agent.py +18 -4
- autogen/agentchat/contrib/math_user_proxy_agent.py +11 -11
- autogen/agentchat/contrib/multimodal_conversable_agent.py +8 -8
- autogen/agentchat/contrib/qdrant_retrieve_user_proxy_agent.py +6 -5
- autogen/agentchat/contrib/rag/chromadb_query_engine.py +22 -26
- autogen/agentchat/contrib/rag/llamaindex_query_engine.py +14 -17
- autogen/agentchat/contrib/rag/mongodb_query_engine.py +27 -37
- autogen/agentchat/contrib/rag/query_engine.py +7 -5
- autogen/agentchat/contrib/retrieve_assistant_agent.py +5 -5
- autogen/agentchat/contrib/retrieve_user_proxy_agent.py +8 -7
- autogen/agentchat/contrib/society_of_mind_agent.py +15 -14
- autogen/agentchat/contrib/swarm_agent.py +76 -98
- autogen/agentchat/contrib/text_analyzer_agent.py +7 -7
- autogen/agentchat/contrib/vectordb/base.py +10 -18
- autogen/agentchat/contrib/vectordb/chromadb.py +2 -1
- autogen/agentchat/contrib/vectordb/couchbase.py +18 -20
- autogen/agentchat/contrib/vectordb/mongodb.py +6 -5
- autogen/agentchat/contrib/vectordb/pgvectordb.py +40 -41
- autogen/agentchat/contrib/vectordb/qdrant.py +5 -5
- autogen/agentchat/contrib/web_surfer.py +20 -19
- autogen/agentchat/conversable_agent.py +292 -290
- autogen/agentchat/group/context_str.py +1 -3
- autogen/agentchat/group/context_variables.py +15 -25
- autogen/agentchat/group/group_tool_executor.py +10 -10
- autogen/agentchat/group/group_utils.py +15 -15
- autogen/agentchat/group/guardrails.py +7 -7
- autogen/agentchat/group/handoffs.py +19 -36
- autogen/agentchat/group/multi_agent_chat.py +7 -7
- autogen/agentchat/group/on_condition.py +4 -7
- autogen/agentchat/group/on_context_condition.py +4 -7
- autogen/agentchat/group/patterns/auto.py +8 -7
- autogen/agentchat/group/patterns/manual.py +7 -6
- autogen/agentchat/group/patterns/pattern.py +13 -12
- autogen/agentchat/group/patterns/random.py +3 -3
- autogen/agentchat/group/patterns/round_robin.py +3 -3
- autogen/agentchat/group/reply_result.py +2 -4
- autogen/agentchat/group/speaker_selection_result.py +5 -5
- autogen/agentchat/group/targets/group_chat_target.py +7 -6
- autogen/agentchat/group/targets/group_manager_target.py +4 -4
- autogen/agentchat/group/targets/transition_target.py +2 -1
- autogen/agentchat/groupchat.py +60 -63
- autogen/agentchat/realtime/experimental/audio_adapters/twilio_audio_adapter.py +4 -4
- autogen/agentchat/realtime/experimental/audio_adapters/websocket_audio_adapter.py +4 -4
- autogen/agentchat/realtime/experimental/clients/gemini/client.py +7 -7
- autogen/agentchat/realtime/experimental/clients/oai/base_client.py +8 -8
- autogen/agentchat/realtime/experimental/clients/oai/rtc_client.py +6 -6
- autogen/agentchat/realtime/experimental/clients/realtime_client.py +10 -9
- autogen/agentchat/realtime/experimental/realtime_agent.py +10 -9
- autogen/agentchat/realtime/experimental/realtime_observer.py +3 -3
- autogen/agentchat/realtime/experimental/realtime_swarm.py +44 -44
- autogen/agentchat/user_proxy_agent.py +10 -9
- autogen/agentchat/utils.py +3 -3
- autogen/agents/contrib/time/time_reply_agent.py +6 -5
- autogen/agents/contrib/time/time_tool_agent.py +2 -1
- autogen/agents/experimental/deep_research/deep_research.py +3 -3
- autogen/agents/experimental/discord/discord.py +2 -2
- autogen/agents/experimental/document_agent/chroma_query_engine.py +29 -44
- autogen/agents/experimental/document_agent/docling_doc_ingest_agent.py +9 -14
- autogen/agents/experimental/document_agent/document_agent.py +15 -16
- autogen/agents/experimental/document_agent/document_conditions.py +3 -3
- autogen/agents/experimental/document_agent/document_utils.py +5 -9
- autogen/agents/experimental/document_agent/inmemory_query_engine.py +14 -20
- autogen/agents/experimental/document_agent/parser_utils.py +4 -4
- autogen/agents/experimental/document_agent/url_utils.py +14 -23
- autogen/agents/experimental/reasoning/reasoning_agent.py +33 -33
- autogen/agents/experimental/slack/slack.py +2 -2
- autogen/agents/experimental/telegram/telegram.py +2 -3
- autogen/agents/experimental/websurfer/websurfer.py +4 -4
- autogen/agents/experimental/wikipedia/wikipedia.py +5 -7
- autogen/browser_utils.py +8 -8
- autogen/cache/abstract_cache_base.py +5 -5
- autogen/cache/cache.py +12 -12
- autogen/cache/cache_factory.py +4 -4
- autogen/cache/cosmos_db_cache.py +9 -9
- autogen/cache/disk_cache.py +6 -6
- autogen/cache/in_memory_cache.py +4 -4
- autogen/cache/redis_cache.py +4 -4
- autogen/code_utils.py +18 -18
- autogen/coding/base.py +6 -6
- autogen/coding/docker_commandline_code_executor.py +9 -9
- autogen/coding/func_with_reqs.py +7 -6
- autogen/coding/jupyter/base.py +3 -3
- autogen/coding/jupyter/docker_jupyter_server.py +3 -4
- autogen/coding/jupyter/import_utils.py +3 -3
- autogen/coding/jupyter/jupyter_client.py +5 -5
- autogen/coding/jupyter/jupyter_code_executor.py +3 -4
- autogen/coding/jupyter/local_jupyter_server.py +2 -6
- autogen/coding/local_commandline_code_executor.py +8 -7
- autogen/coding/markdown_code_extractor.py +1 -2
- autogen/coding/utils.py +1 -2
- autogen/doc_utils.py +3 -2
- autogen/environments/docker_python_environment.py +19 -29
- autogen/environments/python_environment.py +8 -17
- autogen/environments/system_python_environment.py +3 -4
- autogen/environments/venv_python_environment.py +8 -12
- autogen/environments/working_directory.py +1 -2
- autogen/events/agent_events.py +106 -109
- autogen/events/base_event.py +6 -5
- autogen/events/client_events.py +15 -14
- autogen/events/helpers.py +1 -1
- autogen/events/print_event.py +4 -5
- autogen/fast_depends/_compat.py +10 -15
- autogen/fast_depends/core/build.py +17 -36
- autogen/fast_depends/core/model.py +64 -113
- autogen/fast_depends/dependencies/model.py +2 -1
- autogen/fast_depends/dependencies/provider.py +3 -2
- autogen/fast_depends/library/model.py +4 -4
- autogen/fast_depends/schema.py +7 -7
- autogen/fast_depends/use.py +17 -25
- autogen/fast_depends/utils.py +10 -30
- autogen/formatting_utils.py +6 -6
- autogen/graph_utils.py +1 -4
- autogen/import_utils.py +38 -27
- autogen/interop/crewai/crewai.py +2 -2
- autogen/interop/interoperable.py +2 -2
- autogen/interop/langchain/langchain_chat_model_factory.py +3 -2
- autogen/interop/langchain/langchain_tool.py +2 -6
- autogen/interop/litellm/litellm_config_factory.py +6 -7
- autogen/interop/pydantic_ai/pydantic_ai.py +4 -7
- autogen/interop/registry.py +2 -1
- autogen/io/base.py +5 -5
- autogen/io/run_response.py +33 -32
- autogen/io/websockets.py +6 -5
- autogen/json_utils.py +1 -2
- autogen/llm_config/__init__.py +11 -0
- autogen/llm_config/client.py +58 -0
- autogen/llm_config/config.py +384 -0
- autogen/llm_config/entry.py +154 -0
- autogen/logger/base_logger.py +4 -3
- autogen/logger/file_logger.py +2 -1
- autogen/logger/logger_factory.py +2 -2
- autogen/logger/logger_utils.py +2 -2
- autogen/logger/sqlite_logger.py +2 -1
- autogen/math_utils.py +4 -5
- autogen/mcp/__main__.py +6 -6
- autogen/mcp/helpers.py +4 -4
- autogen/mcp/mcp_client.py +170 -29
- autogen/mcp/mcp_proxy/fastapi_code_generator_helpers.py +3 -4
- autogen/mcp/mcp_proxy/mcp_proxy.py +23 -26
- autogen/mcp/mcp_proxy/operation_grouping.py +4 -5
- autogen/mcp/mcp_proxy/operation_renaming.py +6 -10
- autogen/mcp/mcp_proxy/security.py +2 -3
- autogen/messages/agent_messages.py +96 -98
- autogen/messages/base_message.py +6 -5
- autogen/messages/client_messages.py +15 -14
- autogen/messages/print_message.py +4 -5
- autogen/oai/__init__.py +1 -2
- autogen/oai/anthropic.py +42 -41
- autogen/oai/bedrock.py +68 -57
- autogen/oai/cerebras.py +26 -25
- autogen/oai/client.py +113 -139
- autogen/oai/client_utils.py +3 -3
- autogen/oai/cohere.py +34 -11
- autogen/oai/gemini.py +39 -17
- autogen/oai/gemini_types.py +11 -12
- autogen/oai/groq.py +22 -10
- autogen/oai/mistral.py +17 -11
- autogen/oai/oai_models/__init__.py +14 -2
- autogen/oai/oai_models/_models.py +2 -2
- autogen/oai/oai_models/chat_completion.py +13 -14
- autogen/oai/oai_models/chat_completion_message.py +11 -9
- autogen/oai/oai_models/chat_completion_message_tool_call.py +26 -3
- autogen/oai/oai_models/chat_completion_token_logprob.py +3 -4
- autogen/oai/oai_models/completion_usage.py +8 -9
- autogen/oai/ollama.py +19 -9
- autogen/oai/openai_responses.py +40 -17
- autogen/oai/openai_utils.py +48 -38
- autogen/oai/together.py +29 -14
- autogen/retrieve_utils.py +6 -7
- autogen/runtime_logging.py +5 -4
- autogen/token_count_utils.py +7 -4
- autogen/tools/contrib/time/time.py +0 -1
- autogen/tools/dependency_injection.py +5 -6
- autogen/tools/experimental/browser_use/browser_use.py +10 -10
- autogen/tools/experimental/code_execution/python_code_execution.py +5 -7
- autogen/tools/experimental/crawl4ai/crawl4ai.py +12 -15
- autogen/tools/experimental/deep_research/deep_research.py +9 -8
- autogen/tools/experimental/duckduckgo/duckduckgo_search.py +5 -11
- autogen/tools/experimental/firecrawl/firecrawl_tool.py +98 -115
- autogen/tools/experimental/google/authentication/credentials_local_provider.py +1 -1
- autogen/tools/experimental/google/drive/drive_functions.py +4 -4
- autogen/tools/experimental/google/drive/toolkit.py +5 -5
- autogen/tools/experimental/google_search/google_search.py +5 -5
- autogen/tools/experimental/google_search/youtube_search.py +5 -5
- autogen/tools/experimental/messageplatform/discord/discord.py +8 -12
- autogen/tools/experimental/messageplatform/slack/slack.py +14 -20
- autogen/tools/experimental/messageplatform/telegram/telegram.py +8 -12
- autogen/tools/experimental/perplexity/perplexity_search.py +18 -29
- autogen/tools/experimental/reliable/reliable.py +68 -74
- autogen/tools/experimental/searxng/searxng_search.py +20 -19
- autogen/tools/experimental/tavily/tavily_search.py +12 -19
- autogen/tools/experimental/web_search_preview/web_search_preview.py +13 -7
- autogen/tools/experimental/wikipedia/wikipedia.py +7 -10
- autogen/tools/function_utils.py +7 -7
- autogen/tools/tool.py +8 -6
- autogen/types.py +2 -2
- autogen/version.py +1 -1
- ag2-0.9.7.dist-info/RECORD +0 -421
- autogen/llm_config.py +0 -385
- {ag2-0.9.7.dist-info → ag2-0.9.9.dist-info}/WHEEL +0 -0
- {ag2-0.9.7.dist-info → ag2-0.9.9.dist-info}/licenses/LICENSE +0 -0
- {ag2-0.9.7.dist-info → ag2-0.9.9.dist-info}/licenses/NOTICE.md +0 -0
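The headline structural change in this release is visible in the file list above: the single-module autogen/llm_config.py is removed (-385 lines) and replaced by an autogen/llm_config/ package (__init__.py, client.py, config.py, entry.py). Judging only by the import lines that appear in the diffs below, the entry types now live in the package's entry module, and the ModelClient protocol (deleted from autogen/oai/client.py below) is likely what moved into the new autogen/llm_config/client.py (+58 lines). A rough sketch of the import shift, using only paths that appear verbatim in the diffs:

    # 0.9.7: llm_config was one module
    #   from autogen.llm_config import LLMConfigEntry, ...
    # 0.9.9: llm_config is a package; these imports appear in the
    # autogen/oai/client.py diff below
    from autogen.llm_config import ModelClient
    from autogen.llm_config.entry import LLMConfigEntry, LLMConfigEntryDict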
autogen/oai/client.py
CHANGED
@@ -13,10 +13,11 @@ import re
 import sys
 import uuid
 import warnings
+from collections.abc import Callable
 from functools import lru_cache
-from typing import Any,
+from typing import Any, Literal
 
-from pydantic import BaseModel, Field, HttpUrl
+from pydantic import BaseModel, Field, HttpUrl
 from pydantic.type_adapter import TypeAdapter
 
 from ..cache import Cache
@@ -25,7 +26,8 @@ from ..events.client_events import StreamEvent, UsageSummaryEvent
 from ..exception_utils import ModelToolNotSupportedError
 from ..import_utils import optional_import_block, require_optional_import
 from ..io.base import IOStream
-from ..llm_config import
+from ..llm_config import ModelClient
+from ..llm_config.entry import LLMConfigEntry, LLMConfigEntryDict
 from ..logger.logger_utils import get_current_ts
 from ..runtime_logging import log_chat_completion, log_new_client, log_new_wrapper, logging_enabled
 from ..token_count_utils import count_token
@@ -58,7 +60,7 @@ if openai_result.is_successful:
     ERROR = None
     from openai.lib._pydantic import _ensure_strict_json_schema
 else:
-    ERROR:
+    ERROR: ImportError | None = ImportError("Please install openai>=1 and diskcache to use autogen.OpenAIWrapper.")
 
     # OpenAI = object
     # AzureOpenAI = object
@@ -73,7 +75,7 @@ with optional_import_block() as cerebras_result:
     from .cerebras import CerebrasClient
 
 if cerebras_result.is_successful:
-    cerebras_import_exception:
+    cerebras_import_exception: ImportError | None = None
 else:
     cerebras_AuthenticationError = cerebras_InternalServerError = cerebras_RateLimitError = Exception  # noqa: N816
     cerebras_import_exception = ImportError("cerebras_cloud_sdk not found")
@@ -87,7 +89,7 @@ with optional_import_block() as gemini_result:
     from .gemini import GeminiClient
 
 if gemini_result.is_successful:
-    gemini_import_exception:
+    gemini_import_exception: ImportError | None = None
 else:
     gemini_InternalServerError = gemini_ResourceExhausted = Exception  # noqa: N816
     gemini_import_exception = ImportError("google-genai not found")
@@ -101,7 +103,7 @@ with optional_import_block() as anthropic_result:
     from .anthropic import AnthropicClient
 
 if anthropic_result.is_successful:
-    anthropic_import_exception:
+    anthropic_import_exception: ImportError | None = None
 else:
     anthorpic_InternalServerError = anthorpic_RateLimitError = Exception  # noqa: N816
     anthropic_import_exception = ImportError("anthropic not found")
@@ -115,7 +117,7 @@ with optional_import_block() as mistral_result:
     from .mistral import MistralAIClient
 
 if mistral_result.is_successful:
-    mistral_import_exception:
+    mistral_import_exception: ImportError | None = None
 else:
     mistral_SDKError = mistral_HTTPValidationError = Exception  # noqa: N816
     mistral_import_exception = ImportError("mistralai not found")
@@ -126,7 +128,7 @@ with optional_import_block() as together_result:
     from .together import TogetherClient
 
 if together_result.is_successful:
-    together_import_exception:
+    together_import_exception: ImportError | None = None
 else:
     together_TogetherException = Exception  # noqa: N816
     together_import_exception = ImportError("together not found")
@@ -141,7 +143,7 @@ with optional_import_block() as groq_result:
     from .groq import GroqClient
 
 if groq_result.is_successful:
-    groq_import_exception:
+    groq_import_exception: ImportError | None = None
 else:
     groq_InternalServerError = groq_RateLimitError = groq_APIConnectionError = Exception  # noqa: N816
     groq_import_exception = ImportError("groq not found")
@@ -156,7 +158,7 @@ with optional_import_block() as cohere_result:
     from .cohere import CohereClient
 
 if cohere_result.is_successful:
-    cohere_import_exception:
+    cohere_import_exception: ImportError | None = None
 else:
     cohere_InternalServerError = cohere_TooManyRequestsError = cohere_ServiceUnavailableError = Exception  # noqa: N816
     cohere_import_exception = ImportError("cohere not found")
@@ -170,7 +172,7 @@ with optional_import_block() as ollama_result:
     from .ollama import OllamaClient
 
 if ollama_result.is_successful:
-    ollama_import_exception:
+    ollama_import_exception: ImportError | None = None
 else:
     ollama_RequestError = ollama_ResponseError = Exception  # noqa: N816
     ollama_import_exception = ImportError("ollama not found")
@@ -184,7 +186,7 @@ with optional_import_block() as bedrock_result:
     from .bedrock import BedrockClient
 
 if bedrock_result.is_successful:
-    bedrock_import_exception:
+    bedrock_import_exception: ImportError | None = None
 else:
     bedrock_BotoCoreError = bedrock_ClientError = Exception  # noqa: N816
     bedrock_import_exception = ImportError("botocore not found")
@@ -212,6 +214,7 @@ OPENAI_FALLBACK_KWARGS = {
     "default_query",
     "http_client",
     "_strict_response_validation",
+    "webhook_secret",
 }
 
 AOPENAI_FALLBACK_KWARGS = {
@@ -231,124 +234,103 @@ AOPENAI_FALLBACK_KWARGS = {
     "_strict_response_validation",
     "base_url",
     "project",
+    "webhook_secret",
 }
 
 
 @lru_cache(maxsize=128)
-def log_cache_seed_value(cache_seed_value:
+def log_cache_seed_value(cache_seed_value: str | int, client: ModelClient) -> None:
     logger.debug(f"Using cache with seed value {cache_seed_value} for client {client.__class__.__name__}")
 
 
-
+class OpenAIEntryDict(LLMConfigEntryDict, total=False):
+    api_type: Literal["openai"]
+
+    price: list[float] | None
+    tool_choice: Literal["none", "auto", "required"] | None
+    user: str | None
+    stream: bool
+    verbosity: Literal["low", "medium", "high"] | None
+    extra_body: dict[str, Any] | None
+    reasoning_effort: Literal["low", "minimal", "medium", "high"] | None
+    max_completion_tokens: int | None
+
+
 class OpenAILLMConfigEntry(LLMConfigEntry):
     api_type: Literal["openai"] = "openai"
-    top_p: Optional[float] = None
-    price: Optional[list[float]] = Field(default=None, min_length=2, max_length=2)
-    tool_choice: Optional[Literal["none", "auto", "required"]] = None
-    user: Optional[str] = None
 
-
+    price: list[float] | None = Field(default=None, min_length=2, max_length=2)
+    tool_choice: Literal["none", "auto", "required"] | None = None
+    user: str | None = None
+    stream: bool = False
+    verbosity: Literal["low", "medium", "high"] | None = None
+    # The extra_body parameter flows from OpenAILLMConfigEntry to the LLM request through this path:
     # 1. Config Definition: extra_body is defined in OpenAILLMConfigEntry (autogen/oai/client.py:248)
     # 2. Parameter Classification: It's classified as an OpenAI client parameter (not AG2-specific) via the openai_kwargs property (autogen/oai/client.py:752-758)
     # 3. Request Separation: In _separate_create_config() (autogen/oai/client.py:842), extra_body goes into create_config since it's not in the extra_kwargs set.
     # 4. API Call: The create_config becomes params and gets passed directly to OpenAI's create() method via **params (autogen/oai/client.py:551,658)
-    extra_body:
+    extra_body: dict[str, Any] | None = (
         None  # For VLLM - See here: https://docs.vllm.ai/en/latest/serving/openai_compatible_server.html#extra-parameters
     )
     # reasoning models - see: https://platform.openai.com/docs/api-reference/chat/create#chat-create-reasoning_effort
-    reasoning_effort:
-    max_completion_tokens:
+    reasoning_effort: Literal["low", "minimal", "medium", "high"] | None = None
+    max_completion_tokens: int | None = None
 
-    def create_client(self) ->
+    def create_client(self) -> ModelClient:
         raise NotImplementedError("create_client method must be implemented in the derived class.")
 
 
-
+class AzureOpenAIEntryDict(LLMConfigEntryDict, total=False):
+    api_type: Literal["azure"]
+
+    azure_ad_token_provider: str | Callable[[], str] | None
+    stream: bool
+    tool_choice: Literal["none", "auto", "required"] | None
+    user: str | None
+    reasoning_effort: Literal["low", "medium", "high"] | None
+    max_completion_tokens: int | None
+
+
 class AzureOpenAILLMConfigEntry(LLMConfigEntry):
     api_type: Literal["azure"] = "azure"
-
-    azure_ad_token_provider:
-
-
+
+    azure_ad_token_provider: str | Callable[[], str] | None = None
+    stream: bool = False
+    tool_choice: Literal["none", "auto", "required"] | None = None
+    user: str | None = None
     # reasoning models - see:
     # - https://learn.microsoft.com/en-us/azure/ai-services/openai/how-to/reasoning
    # - https://learn.microsoft.com/en-us/azure/ai-services/openai/reference-preview
-    reasoning_effort:
-    max_completion_tokens:
+    reasoning_effort: Literal["low", "medium", "high"] | None = None
+    max_completion_tokens: int | None = None
 
-    def create_client(self) ->
+    def create_client(self) -> ModelClient:
        raise NotImplementedError
 
 
-
+class DeepSeekEntyDict(LLMConfigEntryDict, total=False):
+    api_type: Literal["deepseek"]
+
+    base_url: HttpUrl
+    stream: bool
+    tool_choice: Literal["none", "auto", "required"] | None
+
+
 class DeepSeekLLMConfigEntry(LLMConfigEntry):
     api_type: Literal["deepseek"] = "deepseek"
-
-    temperature: float = Field(
+
+    temperature: float | None = Field(default=None, ge=0.0, le=1.0)
+    top_p: float | None = Field(None, ge=0.0, le=1.0)
     max_tokens: int = Field(8192, ge=1, le=8192)
-    top_p: Optional[float] = Field(None, ge=0.0, le=1.0)
-    tool_choice: Optional[Literal["none", "auto", "required"]] = None
 
-
-
-
-        if v is not None and info.data.get("temperature") is not None:
-            raise ValueError("temperature and top_p cannot be set at the same time.")
-        return v
+    base_url: HttpUrl = HttpUrl("https://api.deepseek.com/v1")
+    stream: bool = False
+    tool_choice: Literal["none", "auto", "required"] | None = None
 
     def create_client(self) -> None:  # type: ignore [override]
         raise NotImplementedError("DeepSeekLLMConfigEntry.create_client is not implemented.")
 
 
-@export_module("autogen")
-class ModelClient(Protocol):
-    """A client class must implement the following methods:
-    - create must return a response object that implements the ModelClientResponseProtocol
-    - cost must return the cost of the response
-    - get_usage must return a dict with the following keys:
-        - prompt_tokens
-        - completion_tokens
-        - total_tokens
-        - cost
-        - model
-
-    This class is used to create a client that can be used by OpenAIWrapper.
-    The response returned from create must adhere to the ModelClientResponseProtocol but can be extended however needed.
-    The message_retrieval method must be implemented to return a list of str or a list of messages from the response.
-    """
-
-    RESPONSE_USAGE_KEYS = ["prompt_tokens", "completion_tokens", "total_tokens", "cost", "model"]
-
-    class ModelClientResponseProtocol(Protocol):
-        class Choice(Protocol):
-            class Message(Protocol):
-                content: Optional[str] | Optional[dict[str, Any]]
-
-            message: Message
-
-        choices: list[Choice]
-        model: str
-
-    def create(self, params: dict[str, Any]) -> ModelClientResponseProtocol: ...  # pragma: no cover
-
-    def message_retrieval(
-        self, response: ModelClientResponseProtocol
-    ) -> Union[list[str], list[ModelClient.ModelClientResponseProtocol.Choice.Message]]:
-        """Retrieve and return a list of strings or a list of Choice.Message from the response.
-
-        NOTE: if a list of Choice.Message is returned, it currently needs to contain the fields of OpenAI's ChatCompletion Message object,
-        since that is expected for function or tool calling in the rest of the codebase at the moment, unless a custom agent is being used.
-        """
-        ...  # pragma: no cover
-
-    def cost(self, response: ModelClientResponseProtocol) -> float: ...  # pragma: no cover
-
-    @staticmethod
-    def get_usage(response: ModelClientResponseProtocol) -> dict:
-        """Return usage summary of the response using RESPONSE_USAGE_KEYS."""
-        ...  # pragma: no cover
-
-
 class PlaceHolderClient:
     def __init__(self, config):
         self.config = config
@@ -358,9 +340,7 @@ class PlaceHolderClient:
 class OpenAIClient:
     """Follows the Client protocol and wraps the OpenAI client."""
 
-    def __init__(
-        self, client: Union[OpenAI, AzureOpenAI], response_format: Union[BaseModel, dict[str, Any], None] = None
-    ):
+    def __init__(self, client: OpenAI | AzureOpenAI, response_format: BaseModel | dict[str, Any] | None = None):
         self._oai_client = client
         self.response_format = response_format
         if (
@@ -372,9 +352,7 @@ class OpenAIClient:
                 "The API key specified is not a valid OpenAI format; it won't work with the OpenAI-hosted model."
             )
 
-    def message_retrieval(
-        self, response: Union[ChatCompletion, Completion]
-    ) -> Union[list[str], list[ChatCompletionMessage]]:
+    def message_retrieval(self, response: ChatCompletion | Completion) -> list[str] | list[ChatCompletionMessage]:
         """Retrieve the messages from the response.
 
         Args:
@@ -511,7 +489,10 @@ class OpenAIClient:
         if "stream" in kwargs:
             kwargs.pop("stream")
 
-        if
+        if (
+            isinstance(kwargs["response_format"], dict)
+            and kwargs["response_format"].get("type") != "json_object"
+        ):
             kwargs["response_format"] = {
                 "type": "json_schema",
                 "json_schema": {
@@ -550,8 +531,8 @@ class OpenAIClient:
         completion_tokens = 0
 
         # Prepare for potential function call
-        full_function_call:
-        full_tool_calls:
+        full_function_call: dict[str, Any] | None = None
+        full_tool_calls: list[dict[str, Any] | None] | None = None
 
         # Send the chat completion request to OpenAI's API and process the response in chunks
         for chunk in create_or_parse(**params):
@@ -678,9 +659,9 @@ class OpenAIClient:
         # Unsupported parameters
         unsupported_params = [
             "temperature",
+            "top_p",
             "frequency_penalty",
             "presence_penalty",
-            "top_p",
             "logprobs",
             "top_logprobs",
             "logit_bias",
@@ -706,7 +687,7 @@ class OpenAIClient:
             msg["role"] = "user"
             msg["content"] = f"System message: {msg['content']}"
 
-    def cost(self, response:
+    def cost(self, response: ChatCompletion | Completion) -> float:
         """Calculate the cost of the response."""
         model = response.model
         if model not in OAI_PRICE1K:
@@ -727,7 +708,7 @@ class OpenAIClient:
         return tmp_price1K * (n_input_tokens + n_output_tokens) / 1000  # type: ignore [operator]
 
     @staticmethod
-    def get_usage(response:
+    def get_usage(response: ChatCompletion | Completion) -> dict:
         return {
             "prompt_tokens": response.usage.prompt_tokens if response.usage is not None else 0,
             "completion_tokens": response.usage.completion_tokens if response.usage is not None else 0,
@@ -763,13 +744,13 @@ class OpenAIWrapper:
         else:
             return OPENAI_FALLBACK_KWARGS | AOPENAI_FALLBACK_KWARGS
 
-    total_usage_summary:
-    actual_usage_summary:
+    total_usage_summary: dict[str, Any] | None = None
+    actual_usage_summary: dict[str, Any] | None = None
 
     def __init__(
         self,
         *,
-        config_list:
+        config_list: list[dict[str, Any]] | None = None,
         **base_config: Any,
     ):
         """Initialize the OpenAIWrapper.
@@ -851,17 +832,6 @@ class OpenAIWrapper:
 
     def _configure_azure_openai(self, config: dict[str, Any], openai_config: dict[str, Any]) -> None:
         openai_config["azure_deployment"] = openai_config.get("azure_deployment", config.get("model"))
-        if openai_config["azure_deployment"] is not None:
-            # Preserve dots for specific model versions that require them
-            deployment_name = openai_config["azure_deployment"]
-            if deployment_name in [
-                "gpt-4.1"
-            ]:  # Add more as needed, Whitelist approach so as to not break existing deployments
-                # Keep the deployment name as-is for these specific models
-                pass
-            else:
-                # Remove dots for all other models (maintain existing behavior)
-                openai_config["azure_deployment"] = deployment_name.replace(".", "")
         openai_config["azure_endpoint"] = openai_config.get("azure_endpoint", openai_config.pop("base_url", None))
 
         # Create a default Azure token provider if requested
@@ -890,6 +860,13 @@ class OpenAIWrapper:
             if key in config:
                 openai_config[key] = config[key]
 
+    def _configure_openai_config_for_gemini(self, config: dict[str, Any], openai_config: dict[str, Any]) -> None:
+        """Update openai_config with additional gemini genai configs."""
+        optional_keys = ["proxy"]
+        for key in optional_keys:
+            if key in config:
+                openai_config[key] = config[key]
+
     def _register_default_client(self, config: dict[str, Any], openai_config: dict[str, Any]) -> None:
         """Create a client with the given config to override openai_config,
         after removing extra kwargs.
@@ -915,7 +892,7 @@ class OpenAIWrapper:
         if api_type is not None and api_type.startswith("azure"):
 
             @require_optional_import("openai>=1.66.2", "openai")
-            def create_azure_openai_client() ->
+            def create_azure_openai_client() -> AzureOpenAI:
                 self._configure_azure_openai(config, openai_config)
                 client = AzureOpenAI(**openai_config)
                 self._clients.append(OpenAIClient(client, response_format=response_format))
@@ -930,6 +907,7 @@ class OpenAIWrapper:
         elif api_type is not None and api_type.startswith("google"):
             if gemini_import_exception:
                 raise ImportError("Please install `google-genai` and 'vertexai' to use Google's API.")
+            self._configure_openai_config_for_gemini(config, openai_config)
             client = GeminiClient(response_format=response_format, **openai_config)
             self._clients.append(client)
         elif api_type is not None and api_type.startswith("anthropic"):
@@ -975,7 +953,7 @@ class OpenAIWrapper:
         elif api_type is not None and api_type.startswith("responses"):
             # OpenAI Responses API (stateful). Reuse the same OpenAI SDK but call the `/responses` endpoint via the new client.
             @require_optional_import("openai>=1.66.2", "openai")
-            def create_responses_client() ->
+            def create_responses_client() -> OpenAI:
                 client = OpenAI(**openai_config)
                 self._clients.append(OpenAIResponsesClient(client, response_format=response_format))
                 return client
@@ -984,7 +962,7 @@ class OpenAIWrapper:
         else:
 
             @require_optional_import("openai>=1.66.2", "openai")
-            def create_openai_client() ->
+            def create_openai_client() -> OpenAI:
                 client = OpenAI(**openai_config)
                 self._clients.append(OpenAIClient(client, response_format))
                 return client
@@ -1025,10 +1003,10 @@ class OpenAIWrapper:
     @classmethod
     def instantiate(
         cls,
-        template:
-        context:
-        allow_format_str_template:
-    ) ->
+        template: str | Callable[[dict[str, Any]], str] | None,
+        context: dict[str, Any] | None = None,
+        allow_format_str_template: bool | None = False,
+    ) -> str | None:
         if not context or template is None:
             return template  # type: ignore [return-value]
         if isinstance(template, str):
@@ -1038,8 +1016,8 @@ class OpenAIWrapper:
     def _construct_create_params(self, create_config: dict[str, Any], extra_kwargs: dict[str, Any]) -> dict[str, Any]:
         """Prime the create_config with additional_kwargs."""
         # Validate the config
-        prompt:
-        messages:
+        prompt: str | None = create_config.get("prompt")
+        messages: list[dict[str, Any]] | None = create_config.get("messages")
         if (prompt is None) == (messages is None):
             raise ValueError("Either prompt or messages should be in create config but not both.")
         context = extra_kwargs.get("context")
@@ -1106,9 +1084,6 @@ class OpenAIWrapper:
             full_config = {**config, **self._config_list[i]}
             # separate the config into create_config and extra_kwargs
             create_config, extra_kwargs = self._separate_create_config(full_config)
-            api_type = extra_kwargs.get("api_type")
-            if api_type and api_type.startswith("azure") and "model" in create_config:
-                create_config["model"] = create_config["model"].replace(".", "")
             # construct the create params
             params = self._construct_create_params(create_config, extra_kwargs)
             # get the cache_seed, filter_func and context
@@ -1336,8 +1311,8 @@ class OpenAIWrapper:
 
     @staticmethod
     def _update_function_call_from_chunk(
-        function_call_chunk:
-        full_function_call:
+        function_call_chunk: ChoiceDeltaToolCallFunction | ChoiceDeltaFunctionCall,
+        full_function_call: dict[str, Any] | None,
         completion_tokens: int,
     ) -> tuple[dict[str, Any], int]:
         """Update the function call from the chunk.
@@ -1368,7 +1343,7 @@ class OpenAIWrapper:
     @staticmethod
     def _update_tool_calls_from_chunk(
         tool_calls_chunk: ChoiceDeltaToolCall,
-        full_tool_call:
+        full_tool_call: dict[str, Any] | None,
         completion_tokens: int,
     ) -> tuple[dict[str, Any], int]:
         """Update the tool call from the chunk.
@@ -1442,7 +1417,7 @@ class OpenAIWrapper:
         if actual_usage is not None:
             self.actual_usage_summary = update_usage(self.actual_usage_summary, actual_usage)
 
-    def print_usage_summary(self, mode:
+    def print_usage_summary(self, mode: str | list[str] = ["actual", "total"]) -> None:
         """Print the usage summary."""
         iostream = IOStream.get_default()
 
@@ -1470,7 +1445,7 @@ class OpenAIWrapper:
     @classmethod
     def extract_text_or_completion_object(
         cls, response: ModelClient.ModelClientResponseProtocol
-    ) ->
+    ) -> list[str] | list[ModelClient.ModelClientResponseProtocol.Choice.Message]:
        """Extract the text or ChatCompletion objects from a completion or chat response.
 
         Args:
@@ -1487,7 +1462,6 @@ class OpenAIWrapper:
     # -----------------------------------------------------------------------------
 
 
-@register_llm_config
 class OpenAIResponsesLLMConfigEntry(OpenAILLMConfigEntry):
     """LLMConfig entry for the OpenAI Responses API (stateful, tool-enabled).
 
@@ -1507,8 +1481,8 @@ class OpenAIResponsesLLMConfigEntry(OpenAILLMConfigEntry):
     """
 
     api_type: Literal["responses"] = "responses"
-    tool_choice:
-    built_in_tools:
+    tool_choice: Literal["none", "auto", "required"] | None = "auto"
+    built_in_tools: list[str] | None = None
 
-    def create_client(self) ->
+    def create_client(self) -> ModelClient:  # pragma: no cover
        raise NotImplementedError("Handled via OpenAIWrapper._register_default_client")
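Beyond the mechanical Optional[X]/Union[...] to X | None modernization, the diff above introduces TypedDict companions (OpenAIEntryDict, AzureOpenAIEntryDict, DeepSeekEntyDict; the "Enty" spelling is in the source) next to the pydantic entry classes. A minimal, self-contained sketch of that pattern, using a simplified stand-in for LLMConfigEntryDict, whose real fields live in autogen/llm_config/entry.py and are not shown in this diff (the model and api_key fields below are assumptions):

    from typing import Literal, TypedDict

    # Simplified stand-in for autogen.llm_config.entry.LLMConfigEntryDict;
    # its real fields are not part of this diff, so these two are assumptions.
    class LLMConfigEntryDictSketch(TypedDict, total=False):
        model: str
        api_key: str

    # Field names below are copied from the OpenAIEntryDict block above.
    class OpenAIEntryDictSketch(LLMConfigEntryDictSketch, total=False):
        api_type: Literal["openai"]
        price: list[float] | None
        tool_choice: Literal["none", "auto", "required"] | None
        stream: bool

    # A plain dict now type-checks at call sites that accept this TypedDict
    # (the model name is a placeholder):
    entry: OpenAIEntryDictSketch = {"model": "gpt-4o-mini", "api_type": "openai", "stream": False}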
autogen/oai/client_utils.py
CHANGED
@@ -8,7 +8,7 @@
 
 import logging
 import warnings
-from typing import Any,
+from typing import Any, Protocol, runtime_checkable
 
 
 @runtime_checkable
@@ -24,8 +24,8 @@ def validate_parameter(
     allowed_types: tuple[Any, ...],
     allow_None: bool,  # noqa: N803
     default_value: Any,
-    numerical_bound:
-    allowed_values:
+    numerical_bound: tuple[float | None, float | None] | None,
+    allowed_values: list[Any] | None,
 ) -> Any:
     """Validates a given config parameter, checking its type, values, and setting defaults
     Parameters:
autogen/oai/cohere.py
CHANGED
@@ -34,14 +34,15 @@ import os
 import sys
 import time
 import warnings
-from typing import Any, Literal
+from typing import Any, Literal
 
 from pydantic import BaseModel, Field
+from typing_extensions import Unpack
 
 from autogen.oai.client_utils import FormatterProtocol, logging_formatter, validate_parameter
 
 from ..import_utils import optional_import_block, require_optional_import
-from ..llm_config import LLMConfigEntry,
+from ..llm_config.entry import LLMConfigEntry, LLMConfigEntryDict
 from .oai_models import ChatCompletion, ChatCompletionMessage, ChatCompletionMessageToolCall, Choice, CompletionUsage
 
 with optional_import_block():
@@ -66,20 +67,30 @@ COHERE_PRICING_1K = {
 }
 
 
-
+class CohereEntryDict(LLMConfigEntryDict, total=False):
+    api_type: Literal["cohere"]
+
+    k: int
+    seed: int | None
+    frequency_penalty: float
+    presence_penalty: float
+    client_name: str | None
+    strict_tools: bool
+    stream: bool
+    tool_choice: Literal["NONE", "REQUIRED"] | None
+
+
 class CohereLLMConfigEntry(LLMConfigEntry):
     api_type: Literal["cohere"] = "cohere"
-
-    max_tokens: Optional[int] = Field(default=None, ge=0)
+
     k: int = Field(default=0, ge=0, le=500)
-
-    seed: Optional[int] = None
+    seed: int | None = None
     frequency_penalty: float = Field(default=0, ge=0, le=1)
     presence_penalty: float = Field(default=0, ge=0, le=1)
-    client_name:
+    client_name: str | None = None
     strict_tools: bool = False
     stream: bool = False
-    tool_choice:
+    tool_choice: Literal["NONE", "REQUIRED"] | None = None
 
     def create_client(self):
         raise NotImplementedError("CohereLLMConfigEntry.create_client is not implemented.")
@@ -88,7 +99,7 @@ class CohereLLMConfigEntry(LLMConfigEntry):
 class CohereClient:
     """Client for Cohere's API."""
 
-    def __init__(self, **kwargs):
+    def __init__(self, **kwargs: Unpack[CohereEntryDict]):
         """Requires api_key or environment variable to be set
 
         Args:
@@ -104,7 +115,7 @@ class CohereClient:
         )
 
         # Store the response format, if provided (for structured outputs)
-        self._response_format:
+        self._response_format: type[BaseModel] | None = None
 
     def message_retrieval(self, response) -> list:
         """Retrieve and return a list of strings or a list of Choice.Message from the response.
@@ -203,7 +214,17 @@ class CohereClient:
         if "k" in params:
             cohere_params["k"] = validate_parameter(params, "k", int, False, 0, (0, 500), None)
 
+        if "top_p" in params:
+            cohere_params["p"] = validate_parameter(params, "top_p", (int, float), False, 0.75, (0.01, 0.99), None)
+
         if "p" in params:
+            warnings.warn(
+                (
+                    "parameter 'p' is deprecated, use 'top_p' instead for consistency with OpenAI API spec. "
+                    "Scheduled for removal in 0.10.0 version."
+                ),
+                DeprecationWarning,
+            )
             cohere_params["p"] = validate_parameter(params, "p", (int, float), False, 0.75, (0.01, 0.99), None)
 
         if "seed" in params:
@@ -402,8 +423,10 @@ class CohereClient:
 
     def _convert_json_response(self, response: str) -> Any:
         """Extract and validate JSON response from the output for structured outputs.
+
         Args:
             response (str): The response from the API.
+
         Returns:
             Any: The parsed JSON response.
         """
|