ag2 0.9.1__py3-none-any.whl → 0.9.1.post0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of ag2 might be problematic. Click here for more details.
- {ag2-0.9.1.dist-info → ag2-0.9.1.post0.dist-info}/METADATA +264 -73
- ag2-0.9.1.post0.dist-info/RECORD +392 -0
- {ag2-0.9.1.dist-info → ag2-0.9.1.post0.dist-info}/WHEEL +1 -2
- autogen/__init__.py +89 -0
- autogen/_website/__init__.py +3 -0
- autogen/_website/generate_api_references.py +427 -0
- autogen/_website/generate_mkdocs.py +1174 -0
- autogen/_website/notebook_processor.py +476 -0
- autogen/_website/process_notebooks.py +656 -0
- autogen/_website/utils.py +412 -0
- autogen/agentchat/__init__.py +44 -0
- autogen/agentchat/agent.py +182 -0
- autogen/agentchat/assistant_agent.py +85 -0
- autogen/agentchat/chat.py +309 -0
- autogen/agentchat/contrib/__init__.py +5 -0
- autogen/agentchat/contrib/agent_eval/README.md +7 -0
- autogen/agentchat/contrib/agent_eval/agent_eval.py +108 -0
- autogen/agentchat/contrib/agent_eval/criterion.py +43 -0
- autogen/agentchat/contrib/agent_eval/critic_agent.py +44 -0
- autogen/agentchat/contrib/agent_eval/quantifier_agent.py +39 -0
- autogen/agentchat/contrib/agent_eval/subcritic_agent.py +45 -0
- autogen/agentchat/contrib/agent_eval/task.py +42 -0
- autogen/agentchat/contrib/agent_optimizer.py +429 -0
- autogen/agentchat/contrib/capabilities/__init__.py +5 -0
- autogen/agentchat/contrib/capabilities/agent_capability.py +20 -0
- autogen/agentchat/contrib/capabilities/generate_images.py +301 -0
- autogen/agentchat/contrib/capabilities/teachability.py +393 -0
- autogen/agentchat/contrib/capabilities/text_compressors.py +66 -0
- autogen/agentchat/contrib/capabilities/tools_capability.py +22 -0
- autogen/agentchat/contrib/capabilities/transform_messages.py +93 -0
- autogen/agentchat/contrib/capabilities/transforms.py +566 -0
- autogen/agentchat/contrib/capabilities/transforms_util.py +122 -0
- autogen/agentchat/contrib/capabilities/vision_capability.py +214 -0
- autogen/agentchat/contrib/captainagent/__init__.py +9 -0
- autogen/agentchat/contrib/captainagent/agent_builder.py +790 -0
- autogen/agentchat/contrib/captainagent/captainagent.py +512 -0
- autogen/agentchat/contrib/captainagent/tool_retriever.py +335 -0
- autogen/agentchat/contrib/captainagent/tools/README.md +44 -0
- autogen/agentchat/contrib/captainagent/tools/__init__.py +5 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/calculate_correlation.py +40 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/calculate_skewness_and_kurtosis.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/detect_outlier_iqr.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/detect_outlier_zscore.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/explore_csv.py +21 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/shapiro_wilk_test.py +30 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/arxiv_download.py +27 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/arxiv_search.py +53 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/extract_pdf_image.py +53 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/extract_pdf_text.py +38 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/get_wikipedia_text.py +21 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/get_youtube_caption.py +34 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/image_qa.py +60 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/optical_character_recognition.py +61 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/perform_web_search.py +47 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/scrape_wikipedia_tables.py +33 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/transcribe_audio_file.py +21 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/youtube_download.py +35 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_circle_area_from_diameter.py +21 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_day_of_the_week.py +18 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_fraction_sum.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_matrix_power.py +31 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_reflected_point.py +16 -0
- autogen/agentchat/contrib/captainagent/tools/math/complex_numbers_product.py +25 -0
- autogen/agentchat/contrib/captainagent/tools/math/compute_currency_conversion.py +23 -0
- autogen/agentchat/contrib/captainagent/tools/math/count_distinct_permutations.py +27 -0
- autogen/agentchat/contrib/captainagent/tools/math/evaluate_expression.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/math/find_continuity_point.py +34 -0
- autogen/agentchat/contrib/captainagent/tools/math/fraction_to_mixed_numbers.py +39 -0
- autogen/agentchat/contrib/captainagent/tools/math/modular_inverse_sum.py +23 -0
- autogen/agentchat/contrib/captainagent/tools/math/simplify_mixed_numbers.py +36 -0
- autogen/agentchat/contrib/captainagent/tools/math/sum_of_digit_factorials.py +15 -0
- autogen/agentchat/contrib/captainagent/tools/math/sum_of_primes_below.py +15 -0
- autogen/agentchat/contrib/captainagent/tools/requirements.txt +10 -0
- autogen/agentchat/contrib/captainagent/tools/tool_description.tsv +34 -0
- autogen/agentchat/contrib/gpt_assistant_agent.py +526 -0
- autogen/agentchat/contrib/graph_rag/__init__.py +9 -0
- autogen/agentchat/contrib/graph_rag/document.py +29 -0
- autogen/agentchat/contrib/graph_rag/falkor_graph_query_engine.py +170 -0
- autogen/agentchat/contrib/graph_rag/falkor_graph_rag_capability.py +103 -0
- autogen/agentchat/contrib/graph_rag/graph_query_engine.py +53 -0
- autogen/agentchat/contrib/graph_rag/graph_rag_capability.py +63 -0
- autogen/agentchat/contrib/graph_rag/neo4j_graph_query_engine.py +268 -0
- autogen/agentchat/contrib/graph_rag/neo4j_graph_rag_capability.py +83 -0
- autogen/agentchat/contrib/graph_rag/neo4j_native_graph_query_engine.py +210 -0
- autogen/agentchat/contrib/graph_rag/neo4j_native_graph_rag_capability.py +93 -0
- autogen/agentchat/contrib/img_utils.py +397 -0
- autogen/agentchat/contrib/llamaindex_conversable_agent.py +117 -0
- autogen/agentchat/contrib/llava_agent.py +187 -0
- autogen/agentchat/contrib/math_user_proxy_agent.py +464 -0
- autogen/agentchat/contrib/multimodal_conversable_agent.py +125 -0
- autogen/agentchat/contrib/qdrant_retrieve_user_proxy_agent.py +324 -0
- autogen/agentchat/contrib/rag/__init__.py +10 -0
- autogen/agentchat/contrib/rag/chromadb_query_engine.py +272 -0
- autogen/agentchat/contrib/rag/llamaindex_query_engine.py +198 -0
- autogen/agentchat/contrib/rag/mongodb_query_engine.py +329 -0
- autogen/agentchat/contrib/rag/query_engine.py +74 -0
- autogen/agentchat/contrib/retrieve_assistant_agent.py +56 -0
- autogen/agentchat/contrib/retrieve_user_proxy_agent.py +703 -0
- autogen/agentchat/contrib/society_of_mind_agent.py +199 -0
- autogen/agentchat/contrib/swarm_agent.py +1425 -0
- autogen/agentchat/contrib/text_analyzer_agent.py +79 -0
- autogen/agentchat/contrib/vectordb/__init__.py +5 -0
- autogen/agentchat/contrib/vectordb/base.py +232 -0
- autogen/agentchat/contrib/vectordb/chromadb.py +315 -0
- autogen/agentchat/contrib/vectordb/couchbase.py +407 -0
- autogen/agentchat/contrib/vectordb/mongodb.py +550 -0
- autogen/agentchat/contrib/vectordb/pgvectordb.py +928 -0
- autogen/agentchat/contrib/vectordb/qdrant.py +320 -0
- autogen/agentchat/contrib/vectordb/utils.py +126 -0
- autogen/agentchat/contrib/web_surfer.py +303 -0
- autogen/agentchat/conversable_agent.py +4020 -0
- autogen/agentchat/group/__init__.py +64 -0
- autogen/agentchat/group/available_condition.py +91 -0
- autogen/agentchat/group/context_condition.py +77 -0
- autogen/agentchat/group/context_expression.py +238 -0
- autogen/agentchat/group/context_str.py +41 -0
- autogen/agentchat/group/context_variables.py +192 -0
- autogen/agentchat/group/group_tool_executor.py +202 -0
- autogen/agentchat/group/group_utils.py +591 -0
- autogen/agentchat/group/handoffs.py +244 -0
- autogen/agentchat/group/llm_condition.py +93 -0
- autogen/agentchat/group/multi_agent_chat.py +237 -0
- autogen/agentchat/group/on_condition.py +58 -0
- autogen/agentchat/group/on_context_condition.py +54 -0
- autogen/agentchat/group/patterns/__init__.py +18 -0
- autogen/agentchat/group/patterns/auto.py +159 -0
- autogen/agentchat/group/patterns/manual.py +176 -0
- autogen/agentchat/group/patterns/pattern.py +288 -0
- autogen/agentchat/group/patterns/random.py +106 -0
- autogen/agentchat/group/patterns/round_robin.py +117 -0
- autogen/agentchat/group/reply_result.py +26 -0
- autogen/agentchat/group/speaker_selection_result.py +41 -0
- autogen/agentchat/group/targets/__init__.py +4 -0
- autogen/agentchat/group/targets/group_chat_target.py +132 -0
- autogen/agentchat/group/targets/group_manager_target.py +151 -0
- autogen/agentchat/group/targets/transition_target.py +413 -0
- autogen/agentchat/group/targets/transition_utils.py +6 -0
- autogen/agentchat/groupchat.py +1694 -0
- autogen/agentchat/realtime/__init__.py +3 -0
- autogen/agentchat/realtime/experimental/__init__.py +20 -0
- autogen/agentchat/realtime/experimental/audio_adapters/__init__.py +8 -0
- autogen/agentchat/realtime/experimental/audio_adapters/twilio_audio_adapter.py +148 -0
- autogen/agentchat/realtime/experimental/audio_adapters/websocket_audio_adapter.py +139 -0
- autogen/agentchat/realtime/experimental/audio_observer.py +42 -0
- autogen/agentchat/realtime/experimental/clients/__init__.py +15 -0
- autogen/agentchat/realtime/experimental/clients/gemini/__init__.py +7 -0
- autogen/agentchat/realtime/experimental/clients/gemini/client.py +274 -0
- autogen/agentchat/realtime/experimental/clients/oai/__init__.py +8 -0
- autogen/agentchat/realtime/experimental/clients/oai/base_client.py +220 -0
- autogen/agentchat/realtime/experimental/clients/oai/rtc_client.py +243 -0
- autogen/agentchat/realtime/experimental/clients/oai/utils.py +48 -0
- autogen/agentchat/realtime/experimental/clients/realtime_client.py +190 -0
- autogen/agentchat/realtime/experimental/function_observer.py +85 -0
- autogen/agentchat/realtime/experimental/realtime_agent.py +158 -0
- autogen/agentchat/realtime/experimental/realtime_events.py +42 -0
- autogen/agentchat/realtime/experimental/realtime_observer.py +100 -0
- autogen/agentchat/realtime/experimental/realtime_swarm.py +475 -0
- autogen/agentchat/realtime/experimental/websockets.py +21 -0
- autogen/agentchat/realtime_agent/__init__.py +21 -0
- autogen/agentchat/user_proxy_agent.py +111 -0
- autogen/agentchat/utils.py +206 -0
- autogen/agents/__init__.py +3 -0
- autogen/agents/contrib/__init__.py +10 -0
- autogen/agents/contrib/time/__init__.py +8 -0
- autogen/agents/contrib/time/time_reply_agent.py +73 -0
- autogen/agents/contrib/time/time_tool_agent.py +51 -0
- autogen/agents/experimental/__init__.py +27 -0
- autogen/agents/experimental/deep_research/__init__.py +7 -0
- autogen/agents/experimental/deep_research/deep_research.py +52 -0
- autogen/agents/experimental/discord/__init__.py +7 -0
- autogen/agents/experimental/discord/discord.py +66 -0
- autogen/agents/experimental/document_agent/__init__.py +19 -0
- autogen/agents/experimental/document_agent/chroma_query_engine.py +316 -0
- autogen/agents/experimental/document_agent/docling_doc_ingest_agent.py +118 -0
- autogen/agents/experimental/document_agent/document_agent.py +461 -0
- autogen/agents/experimental/document_agent/document_conditions.py +50 -0
- autogen/agents/experimental/document_agent/document_utils.py +380 -0
- autogen/agents/experimental/document_agent/inmemory_query_engine.py +220 -0
- autogen/agents/experimental/document_agent/parser_utils.py +130 -0
- autogen/agents/experimental/document_agent/url_utils.py +426 -0
- autogen/agents/experimental/reasoning/__init__.py +7 -0
- autogen/agents/experimental/reasoning/reasoning_agent.py +1178 -0
- autogen/agents/experimental/slack/__init__.py +7 -0
- autogen/agents/experimental/slack/slack.py +73 -0
- autogen/agents/experimental/telegram/__init__.py +7 -0
- autogen/agents/experimental/telegram/telegram.py +77 -0
- autogen/agents/experimental/websurfer/__init__.py +7 -0
- autogen/agents/experimental/websurfer/websurfer.py +62 -0
- autogen/agents/experimental/wikipedia/__init__.py +7 -0
- autogen/agents/experimental/wikipedia/wikipedia.py +90 -0
- autogen/browser_utils.py +309 -0
- autogen/cache/__init__.py +10 -0
- autogen/cache/abstract_cache_base.py +75 -0
- autogen/cache/cache.py +203 -0
- autogen/cache/cache_factory.py +88 -0
- autogen/cache/cosmos_db_cache.py +144 -0
- autogen/cache/disk_cache.py +102 -0
- autogen/cache/in_memory_cache.py +58 -0
- autogen/cache/redis_cache.py +123 -0
- autogen/code_utils.py +596 -0
- autogen/coding/__init__.py +22 -0
- autogen/coding/base.py +119 -0
- autogen/coding/docker_commandline_code_executor.py +268 -0
- autogen/coding/factory.py +47 -0
- autogen/coding/func_with_reqs.py +202 -0
- autogen/coding/jupyter/__init__.py +23 -0
- autogen/coding/jupyter/base.py +36 -0
- autogen/coding/jupyter/docker_jupyter_server.py +167 -0
- autogen/coding/jupyter/embedded_ipython_code_executor.py +182 -0
- autogen/coding/jupyter/import_utils.py +82 -0
- autogen/coding/jupyter/jupyter_client.py +231 -0
- autogen/coding/jupyter/jupyter_code_executor.py +160 -0
- autogen/coding/jupyter/local_jupyter_server.py +172 -0
- autogen/coding/local_commandline_code_executor.py +405 -0
- autogen/coding/markdown_code_extractor.py +45 -0
- autogen/coding/utils.py +56 -0
- autogen/doc_utils.py +34 -0
- autogen/events/__init__.py +7 -0
- autogen/events/agent_events.py +1010 -0
- autogen/events/base_event.py +99 -0
- autogen/events/client_events.py +167 -0
- autogen/events/helpers.py +36 -0
- autogen/events/print_event.py +46 -0
- autogen/exception_utils.py +73 -0
- autogen/extensions/__init__.py +5 -0
- autogen/fast_depends/__init__.py +16 -0
- autogen/fast_depends/_compat.py +80 -0
- autogen/fast_depends/core/__init__.py +14 -0
- autogen/fast_depends/core/build.py +225 -0
- autogen/fast_depends/core/model.py +576 -0
- autogen/fast_depends/dependencies/__init__.py +15 -0
- autogen/fast_depends/dependencies/model.py +29 -0
- autogen/fast_depends/dependencies/provider.py +39 -0
- autogen/fast_depends/library/__init__.py +10 -0
- autogen/fast_depends/library/model.py +46 -0
- autogen/fast_depends/py.typed +6 -0
- autogen/fast_depends/schema.py +66 -0
- autogen/fast_depends/use.py +280 -0
- autogen/fast_depends/utils.py +187 -0
- autogen/formatting_utils.py +83 -0
- autogen/function_utils.py +13 -0
- autogen/graph_utils.py +178 -0
- autogen/import_utils.py +526 -0
- autogen/interop/__init__.py +22 -0
- autogen/interop/crewai/__init__.py +7 -0
- autogen/interop/crewai/crewai.py +88 -0
- autogen/interop/interoperability.py +71 -0
- autogen/interop/interoperable.py +46 -0
- autogen/interop/langchain/__init__.py +8 -0
- autogen/interop/langchain/langchain_chat_model_factory.py +155 -0
- autogen/interop/langchain/langchain_tool.py +82 -0
- autogen/interop/litellm/__init__.py +7 -0
- autogen/interop/litellm/litellm_config_factory.py +113 -0
- autogen/interop/pydantic_ai/__init__.py +7 -0
- autogen/interop/pydantic_ai/pydantic_ai.py +168 -0
- autogen/interop/registry.py +69 -0
- autogen/io/__init__.py +15 -0
- autogen/io/base.py +151 -0
- autogen/io/console.py +56 -0
- autogen/io/processors/__init__.py +12 -0
- autogen/io/processors/base.py +21 -0
- autogen/io/processors/console_event_processor.py +56 -0
- autogen/io/run_response.py +293 -0
- autogen/io/thread_io_stream.py +63 -0
- autogen/io/websockets.py +213 -0
- autogen/json_utils.py +43 -0
- autogen/llm_config.py +379 -0
- autogen/logger/__init__.py +11 -0
- autogen/logger/base_logger.py +128 -0
- autogen/logger/file_logger.py +261 -0
- autogen/logger/logger_factory.py +42 -0
- autogen/logger/logger_utils.py +57 -0
- autogen/logger/sqlite_logger.py +523 -0
- autogen/math_utils.py +339 -0
- autogen/mcp/__init__.py +7 -0
- autogen/mcp/mcp_client.py +208 -0
- autogen/messages/__init__.py +7 -0
- autogen/messages/agent_messages.py +948 -0
- autogen/messages/base_message.py +107 -0
- autogen/messages/client_messages.py +171 -0
- autogen/messages/print_message.py +49 -0
- autogen/oai/__init__.py +53 -0
- autogen/oai/anthropic.py +714 -0
- autogen/oai/bedrock.py +628 -0
- autogen/oai/cerebras.py +299 -0
- autogen/oai/client.py +1435 -0
- autogen/oai/client_utils.py +169 -0
- autogen/oai/cohere.py +479 -0
- autogen/oai/gemini.py +990 -0
- autogen/oai/gemini_types.py +129 -0
- autogen/oai/groq.py +305 -0
- autogen/oai/mistral.py +303 -0
- autogen/oai/oai_models/__init__.py +11 -0
- autogen/oai/oai_models/_models.py +16 -0
- autogen/oai/oai_models/chat_completion.py +87 -0
- autogen/oai/oai_models/chat_completion_audio.py +32 -0
- autogen/oai/oai_models/chat_completion_message.py +86 -0
- autogen/oai/oai_models/chat_completion_message_tool_call.py +37 -0
- autogen/oai/oai_models/chat_completion_token_logprob.py +63 -0
- autogen/oai/oai_models/completion_usage.py +60 -0
- autogen/oai/ollama.py +643 -0
- autogen/oai/openai_utils.py +881 -0
- autogen/oai/together.py +370 -0
- autogen/retrieve_utils.py +491 -0
- autogen/runtime_logging.py +160 -0
- autogen/token_count_utils.py +267 -0
- autogen/tools/__init__.py +20 -0
- autogen/tools/contrib/__init__.py +9 -0
- autogen/tools/contrib/time/__init__.py +7 -0
- autogen/tools/contrib/time/time.py +41 -0
- autogen/tools/dependency_injection.py +254 -0
- autogen/tools/experimental/__init__.py +43 -0
- autogen/tools/experimental/browser_use/__init__.py +7 -0
- autogen/tools/experimental/browser_use/browser_use.py +161 -0
- autogen/tools/experimental/crawl4ai/__init__.py +7 -0
- autogen/tools/experimental/crawl4ai/crawl4ai.py +153 -0
- autogen/tools/experimental/deep_research/__init__.py +7 -0
- autogen/tools/experimental/deep_research/deep_research.py +328 -0
- autogen/tools/experimental/duckduckgo/__init__.py +7 -0
- autogen/tools/experimental/duckduckgo/duckduckgo_search.py +109 -0
- autogen/tools/experimental/google/__init__.py +14 -0
- autogen/tools/experimental/google/authentication/__init__.py +11 -0
- autogen/tools/experimental/google/authentication/credentials_hosted_provider.py +43 -0
- autogen/tools/experimental/google/authentication/credentials_local_provider.py +91 -0
- autogen/tools/experimental/google/authentication/credentials_provider.py +35 -0
- autogen/tools/experimental/google/drive/__init__.py +9 -0
- autogen/tools/experimental/google/drive/drive_functions.py +124 -0
- autogen/tools/experimental/google/drive/toolkit.py +88 -0
- autogen/tools/experimental/google/model.py +17 -0
- autogen/tools/experimental/google/toolkit_protocol.py +19 -0
- autogen/tools/experimental/google_search/__init__.py +8 -0
- autogen/tools/experimental/google_search/google_search.py +93 -0
- autogen/tools/experimental/google_search/youtube_search.py +181 -0
- autogen/tools/experimental/messageplatform/__init__.py +17 -0
- autogen/tools/experimental/messageplatform/discord/__init__.py +7 -0
- autogen/tools/experimental/messageplatform/discord/discord.py +288 -0
- autogen/tools/experimental/messageplatform/slack/__init__.py +7 -0
- autogen/tools/experimental/messageplatform/slack/slack.py +391 -0
- autogen/tools/experimental/messageplatform/telegram/__init__.py +7 -0
- autogen/tools/experimental/messageplatform/telegram/telegram.py +275 -0
- autogen/tools/experimental/perplexity/__init__.py +7 -0
- autogen/tools/experimental/perplexity/perplexity_search.py +260 -0
- autogen/tools/experimental/tavily/__init__.py +7 -0
- autogen/tools/experimental/tavily/tavily_search.py +183 -0
- autogen/tools/experimental/web_search_preview/__init__.py +7 -0
- autogen/tools/experimental/web_search_preview/web_search_preview.py +114 -0
- autogen/tools/experimental/wikipedia/__init__.py +7 -0
- autogen/tools/experimental/wikipedia/wikipedia.py +287 -0
- autogen/tools/function_utils.py +411 -0
- autogen/tools/tool.py +187 -0
- autogen/tools/toolkit.py +86 -0
- autogen/types.py +29 -0
- autogen/version.py +7 -0
- ag2-0.9.1.dist-info/RECORD +0 -6
- ag2-0.9.1.dist-info/top_level.txt +0 -1
- {ag2-0.9.1.dist-info → ag2-0.9.1.post0.dist-info/licenses}/LICENSE +0 -0
- {ag2-0.9.1.dist-info → ag2-0.9.1.post0.dist-info/licenses}/NOTICE.md +0 -0
autogen/oai/cerebras.py
ADDED
|
@@ -0,0 +1,299 @@
|
|
|
1
|
+
# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors
|
|
2
|
+
#
|
|
3
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
4
|
+
#
|
|
5
|
+
# Portions derived from https://github.com/microsoft/autogen are under the MIT License.
|
|
6
|
+
# SPDX-License-Identifier: MIT
|
|
7
|
+
"""Create an OpenAI-compatible client using Cerebras's API.
|
|
8
|
+
|
|
9
|
+
Example:
|
|
10
|
+
```python
|
|
11
|
+
llm_config = {
|
|
12
|
+
"config_list": [{"api_type": "cerebras", "model": "llama3.1-8b", "api_key": os.environ.get("CEREBRAS_API_KEY")}]
|
|
13
|
+
}
|
|
14
|
+
|
|
15
|
+
agent = autogen.AssistantAgent("my_agent", llm_config=llm_config)
|
|
16
|
+
```
|
|
17
|
+
|
|
18
|
+
Install Cerebras's python library using: pip install --upgrade cerebras_cloud_sdk
|
|
19
|
+
|
|
20
|
+
Resources:
|
|
21
|
+
- https://inference-docs.cerebras.ai/quickstart
|
|
22
|
+
"""
|
|
23
|
+
|
|
24
|
+
from __future__ import annotations
|
|
25
|
+
|
|
26
|
+
import copy
|
|
27
|
+
import math
|
|
28
|
+
import os
|
|
29
|
+
import time
|
|
30
|
+
import warnings
|
|
31
|
+
from typing import Any, Literal, Optional
|
|
32
|
+
|
|
33
|
+
from pydantic import Field, ValidationInfo, field_validator
|
|
34
|
+
|
|
35
|
+
from ..import_utils import optional_import_block, require_optional_import
|
|
36
|
+
from ..llm_config import LLMConfigEntry, register_llm_config
|
|
37
|
+
from .client_utils import should_hide_tools, validate_parameter
|
|
38
|
+
from .oai_models import ChatCompletion, ChatCompletionMessage, ChatCompletionMessageToolCall, Choice, CompletionUsage
|
|
39
|
+
|
|
40
|
+
with optional_import_block():
|
|
41
|
+
from cerebras.cloud.sdk import Cerebras, Stream
|
|
42
|
+
|
|
43
|
+
# Pricing table keyed by model name. Each value is an (input, output) pair of
# costs per 1,000 tokens, unpacked in that order by calculate_cerebras_cost.
# Models missing from this table are costed at 0.0 (with a warning) there.
CEREBRAS_PRICING_1K = {
    # Convert pricing per million to per thousand tokens.
    "llama3.1-8b": (0.10 / 1000, 0.10 / 1000),
    "llama-3.3-70b": (0.85 / 1000, 1.20 / 1000),
}
|
|
48
|
+
|
|
49
|
+
|
|
50
|
+
@register_llm_config
class CerebrasLLMConfigEntry(LLMConfigEntry):
    """Config-list entry describing a Cerebras model (``api_type="cerebras"``)."""

    # Discriminator value identifying this entry as a Cerebras entry.
    api_type: Literal["cerebras"] = "cerebras"
    # Optional generation settings; None means "not specified".
    max_tokens: Optional[int] = None
    seed: Optional[int] = None
    # Streaming is off unless explicitly enabled.
    stream: bool = False
    # Defaults to 1.0 and is constrained to the closed range [0.0, 1.5].
    temperature: float = Field(default=1.0, ge=0.0, le=1.5)
    top_p: Optional[float] = None
    # Tool-hiding policy; restricted to the three literal values below.
    hide_tools: Literal["if_all_run", "if_any_run", "never"] = "never"
    tool_choice: Optional[Literal["none", "auto", "required"]] = None

    @field_validator("top_p", mode="before")
    @classmethod
    def check_top_p(cls, v: Any, info: ValidationInfo) -> Any:
        """Reject a non-None ``top_p`` when a temperature is present in the validated data.

        Args:
            v: The raw ``top_p`` value (this validator runs in "before" mode).
            info: Validation context; ``info.data`` is consulted for ``temperature``.

        Returns:
            ``v`` unchanged when the check passes.

        Raises:
            ValueError: If ``v`` is not None and ``info.data`` holds a non-None temperature.
        """
        # NOTE(review): `temperature` is declared above with a default of 1.0, so
        # presumably `info.data` always carries a non-None temperature and any
        # explicit `top_p` is rejected here — confirm against pydantic's handling
        # of defaulted fields in `ValidationInfo.data`.
        if v is not None and info.data.get("temperature") is not None:
            raise ValueError("temperature and top_p cannot be set at the same time.")
        return v

    def create_client(self):
        """Not supported for this entry type; always raises NotImplementedError."""
        raise NotImplementedError("CerebrasLLMConfigEntry.create_client is not implemented.")
|
|
70
|
+
|
|
71
|
+
|
|
72
|
+
class CerebrasClient:
    """Client for Cerebras's API.

    Sends chat-completion requests through the Cerebras SDK and repackages the
    result as the OpenAI-style ``ChatCompletion`` object built in ``create``.
    """

    def __init__(self, api_key=None, **kwargs):
        """Requires api_key or environment variable to be set

        Args:
            api_key (str): The API key for using Cerebras (or environment variable CEREBRAS_API_KEY needs to be set)
            **kwargs: Additional keyword arguments. Only ``response_format`` is
                inspected (a warning is emitted when it is set); nothing else is
                used by this constructor.

        Raises:
            AssertionError: If no API key is given and CEREBRAS_API_KEY is unset or empty.
        """
        # Ensure we have the api_key upon instantiation
        self.api_key = api_key
        if not self.api_key:
            self.api_key = os.getenv("CEREBRAS_API_KEY")

        # Deliberately left as an assert so the exception type seen by existing
        # callers (AssertionError) does not change.
        assert self.api_key, (
            "Please include the api_key in your config list entry for Cerebras or set the CEREBRAS_API_KEY env variable."
        )

        if "response_format" in kwargs and kwargs["response_format"] is not None:
            warnings.warn("response_format is not supported for Cerebras, it will be ignored.", UserWarning)

    def message_retrieval(self, response: ChatCompletion) -> list:
        """Retrieve and return a list of strings or a list of Choice.Message from the response.

        NOTE: if a list of Choice.Message is returned, it currently needs to contain the fields of OpenAI's ChatCompletion Message object,
        since that is expected for function or tool calling in the rest of the codebase at the moment, unless a custom agent is being used.
        """
        return [choice.message for choice in response.choices]

    def cost(self, response: ChatCompletion) -> float:
        """Return the cost value attached to ``response`` by ``create``."""
        # Note: This field isn't explicitly in `ChatCompletion`, but is injected during chat creation.
        return response.cost

    @staticmethod
    def get_usage(response: ChatCompletion) -> dict:
        """Return usage summary of the response using RESPONSE_USAGE_KEYS."""
        # ...  # pragma: no cover
        return {
            "prompt_tokens": response.usage.prompt_tokens,
            "completion_tokens": response.usage.completion_tokens,
            "total_tokens": response.usage.total_tokens,
            "cost": response.cost,
            "model": response.model,
        }

    def parse_params(self, params: dict[str, Any]) -> dict[str, Any]:
        """Loads the parameters for Cerebras API from the passed in parameters and returns a validated set. Checks types, ranges, and sets defaults

        Args:
            params: Request parameters; ``model`` is mandatory, the remaining keys
                read here are ``max_tokens``, ``seed``, ``stream``, ``temperature``,
                ``top_p`` and ``tool_choice``.

        Returns:
            A new dict holding ``model`` plus one entry for each of the keys above,
            each produced by ``validate_parameter``.

        Raises:
            AssertionError: If ``model`` is missing or falsy.
        """
        cerebras_params = {}

        # Check that we have what we need to use Cerebras's API
        # We won't enforce the available models as they are likely to change
        cerebras_params["model"] = params.get("model")
        assert cerebras_params["model"], (
            "Please specify the 'model' in your config list entry to nominate the Cerebras model to use."
        )

        # Validate allowed Cerebras parameters
        # https://inference-docs.cerebras.ai/api-reference/chat-completions
        cerebras_params["max_tokens"] = validate_parameter(params, "max_tokens", int, True, None, (0, None), None)
        cerebras_params["seed"] = validate_parameter(params, "seed", int, True, None, None, None)
        cerebras_params["stream"] = validate_parameter(params, "stream", bool, True, False, None, None)
        cerebras_params["temperature"] = validate_parameter(
            params, "temperature", (int, float), True, 1, (0, 1.5), None
        )
        cerebras_params["top_p"] = validate_parameter(params, "top_p", (int, float), True, None, None, None)
        cerebras_params["tool_choice"] = validate_parameter(
            params, "tool_choice", str, True, None, None, ["none", "auto", "required"]
        )

        return cerebras_params

    @require_optional_import("cerebras", "cerebras")
    def create(self, params: dict) -> ChatCompletion:
        """Run a chat completion against Cerebras and return it as a ``ChatCompletion``.

        Args:
            params: Request parameters. ``messages`` (default ``[]``) is converted
                with ``oai_messages_to_cerebras_messages``; ``tools`` is forwarded
                unless ``should_hide_tools`` says to hide it; everything else is
                taken from ``parse_params``.

        Returns:
            A ``ChatCompletion`` with a single assistant choice, token usage and an
            injected ``cost`` value.

        Raises:
            RuntimeError: If a streaming response ends without yielding any chunk.
        """
        messages = params.get("messages", [])

        # Convert AG2 messages to Cerebras messages
        cerebras_messages = oai_messages_to_cerebras_messages(messages)

        # Parse parameters to the Cerebras API's parameters
        cerebras_params = self.parse_params(params)

        # Add tools to the call if we have them and aren't hiding them
        if "tools" in params:
            hide_tools = validate_parameter(
                params, "hide_tools", str, False, "never", None, ["if_all_run", "if_any_run", "never"]
            )
            if not should_hide_tools(cerebras_messages, params["tools"], hide_tools):
                cerebras_params["tools"] = params["tools"]

        cerebras_params["messages"] = cerebras_messages

        # We use chat model by default, and set max_retries to 5 (in line with typical retries loop)
        client = Cerebras(api_key=self.api_key, max_retries=5)

        # Token counts will be returned
        prompt_tokens = 0
        completion_tokens = 0
        total_tokens = 0

        # State accumulated while reading a stream; untouched for non-streaming calls.
        streamed_text = ""
        streaming_tool_calls = []
        last_chunk = None

        response = client.chat.completions.create(**cerebras_params)

        if cerebras_params["stream"]:
            # Read in the chunks as they stream, taking in tool_calls which may be across
            # multiple chunks if more than one suggested
            for chunk in response:
                last_chunk = chunk

                # Grab first choice, which _should_ always be generated.
                delta = chunk.choices[0].delta
                streamed_text = streamed_text + (getattr(delta, "content", None) or "")

                # NOTE(review): this membership test and the subscripting below assume
                # `delta` and its tool calls behave like mappings. If the SDK returns
                # attribute-style model objects the test may never be true and streamed
                # tool calls would be dropped — confirm against the cerebras_cloud_sdk
                # streaming types.
                if "tool_calls" in delta:
                    # We have a tool call recommendation
                    for tool_call in delta["tool_calls"]:
                        streaming_tool_calls.append(
                            ChatCompletionMessageToolCall(
                                id=tool_call["id"],
                                function={
                                    "name": tool_call["function"]["name"],
                                    "arguments": tool_call["function"]["arguments"],
                                },
                                type="function",
                            )
                        )

                # Usage figures are read from the chunk that carries a finish reason.
                if chunk.choices[0].finish_reason:
                    prompt_tokens = chunk.usage.prompt_tokens
                    completion_tokens = chunk.usage.completion_tokens
                    total_tokens = chunk.usage.total_tokens
        else:
            # Non-streaming finished
            prompt_tokens = response.usage.prompt_tokens
            completion_tokens = response.usage.completion_tokens
            total_tokens = response.usage.total_tokens

        if isinstance(response, Stream):
            # Streaming response
            if last_chunk is None:
                # Without this guard the code below would fail with an unbound-variable
                # error that hides the real problem.
                raise RuntimeError("No chunks were read from the Cerebras streaming response.")

            if last_chunk.choices[0].finish_reason == "tool_calls":
                cerebras_finish = "tool_calls"
                tool_calls = streaming_tool_calls
            else:
                cerebras_finish = "stop"
                tool_calls = None

            response_content = streamed_text
            response_id = last_chunk.id
        else:
            # Non-streaming response
            # If we have tool calls as the response, populate completed tool calls for our return OAI response
            if response.choices[0].finish_reason == "tool_calls":
                cerebras_finish = "tool_calls"
                tool_calls = []
                for tool_call in response.choices[0].message.tool_calls:
                    tool_calls.append(
                        ChatCompletionMessageToolCall(
                            id=tool_call.id,
                            function={"name": tool_call.function.name, "arguments": tool_call.function.arguments},
                            type="function",
                        )
                    )
            else:
                cerebras_finish = "stop"
                tool_calls = None

            response_content = response.choices[0].message.content
            response_id = response.id

        # 3. convert output
        message = ChatCompletionMessage(
            role="assistant",
            content=response_content,
            function_call=None,
            tool_calls=tool_calls,
        )
        choices = [Choice(finish_reason=cerebras_finish, index=0, message=message)]

        response_oai = ChatCompletion(
            id=response_id,
            model=cerebras_params["model"],
            created=int(time.time()),
            object="chat.completion",
            choices=choices,
            usage=CompletionUsage(
                prompt_tokens=prompt_tokens,
                completion_tokens=completion_tokens,
                total_tokens=total_tokens,
            ),
            # Note: This seems to be a field that isn't in the schema of `ChatCompletion`, so Pydantic
            # just adds it dynamically.
            cost=calculate_cerebras_cost(prompt_tokens, completion_tokens, cerebras_params["model"]),
        )

        return response_oai
|
|
271
|
+
|
|
272
|
+
|
|
273
|
+
def oai_messages_to_cerebras_messages(messages: list[dict[str, Any]]) -> list[dict[str, Any]]:
    """Return a Cerebras-ready copy of OAI-format messages.

    The input is deep-copied, so neither the list nor its message dicts are
    modified; the copy has the ``name`` key stripped from every message.
    """
    converted = copy.deepcopy(messages)

    for entry in converted:
        # Only drop the name field when the message actually carries one.
        if "name" not in entry:
            continue
        entry.pop("name", None)

    return converted
|
|
285
|
+
|
|
286
|
+
|
|
287
|
+
def calculate_cerebras_cost(input_tokens: int, output_tokens: int, model: str) -> float:
    """Price a completion from its token counts using CEREBRAS_PRICING_1K.

    The input cost, the output cost and their sum are each rounded up to six
    decimal places. A model with no pricing entry triggers a UserWarning and
    yields 0.0.
    """
    if model not in CEREBRAS_PRICING_1K:
        warnings.warn(f"Cost calculation not available for model {model}", UserWarning)
        return 0.0

    def _ceil_micro(amount: float) -> float:
        # Round up to the next millionth.
        return math.ceil(amount * 1e6) / 1e6

    prompt_rate, completion_rate = CEREBRAS_PRICING_1K[model]
    prompt_cost = _ceil_micro((input_tokens / 1000) * prompt_rate)
    completion_cost = _ceil_micro((output_tokens / 1000) * completion_rate)
    return _ceil_micro(prompt_cost + completion_cost)
|