ag2 0.9.1__py3-none-any.whl → 0.9.1.post0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of ag2 might be problematic. Click here for more details.
- {ag2-0.9.1.dist-info → ag2-0.9.1.post0.dist-info}/METADATA +264 -73
- ag2-0.9.1.post0.dist-info/RECORD +392 -0
- {ag2-0.9.1.dist-info → ag2-0.9.1.post0.dist-info}/WHEEL +1 -2
- autogen/__init__.py +89 -0
- autogen/_website/__init__.py +3 -0
- autogen/_website/generate_api_references.py +427 -0
- autogen/_website/generate_mkdocs.py +1174 -0
- autogen/_website/notebook_processor.py +476 -0
- autogen/_website/process_notebooks.py +656 -0
- autogen/_website/utils.py +412 -0
- autogen/agentchat/__init__.py +44 -0
- autogen/agentchat/agent.py +182 -0
- autogen/agentchat/assistant_agent.py +85 -0
- autogen/agentchat/chat.py +309 -0
- autogen/agentchat/contrib/__init__.py +5 -0
- autogen/agentchat/contrib/agent_eval/README.md +7 -0
- autogen/agentchat/contrib/agent_eval/agent_eval.py +108 -0
- autogen/agentchat/contrib/agent_eval/criterion.py +43 -0
- autogen/agentchat/contrib/agent_eval/critic_agent.py +44 -0
- autogen/agentchat/contrib/agent_eval/quantifier_agent.py +39 -0
- autogen/agentchat/contrib/agent_eval/subcritic_agent.py +45 -0
- autogen/agentchat/contrib/agent_eval/task.py +42 -0
- autogen/agentchat/contrib/agent_optimizer.py +429 -0
- autogen/agentchat/contrib/capabilities/__init__.py +5 -0
- autogen/agentchat/contrib/capabilities/agent_capability.py +20 -0
- autogen/agentchat/contrib/capabilities/generate_images.py +301 -0
- autogen/agentchat/contrib/capabilities/teachability.py +393 -0
- autogen/agentchat/contrib/capabilities/text_compressors.py +66 -0
- autogen/agentchat/contrib/capabilities/tools_capability.py +22 -0
- autogen/agentchat/contrib/capabilities/transform_messages.py +93 -0
- autogen/agentchat/contrib/capabilities/transforms.py +566 -0
- autogen/agentchat/contrib/capabilities/transforms_util.py +122 -0
- autogen/agentchat/contrib/capabilities/vision_capability.py +214 -0
- autogen/agentchat/contrib/captainagent/__init__.py +9 -0
- autogen/agentchat/contrib/captainagent/agent_builder.py +790 -0
- autogen/agentchat/contrib/captainagent/captainagent.py +512 -0
- autogen/agentchat/contrib/captainagent/tool_retriever.py +335 -0
- autogen/agentchat/contrib/captainagent/tools/README.md +44 -0
- autogen/agentchat/contrib/captainagent/tools/__init__.py +5 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/calculate_correlation.py +40 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/calculate_skewness_and_kurtosis.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/detect_outlier_iqr.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/detect_outlier_zscore.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/explore_csv.py +21 -0
- autogen/agentchat/contrib/captainagent/tools/data_analysis/shapiro_wilk_test.py +30 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/arxiv_download.py +27 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/arxiv_search.py +53 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/extract_pdf_image.py +53 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/extract_pdf_text.py +38 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/get_wikipedia_text.py +21 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/get_youtube_caption.py +34 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/image_qa.py +60 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/optical_character_recognition.py +61 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/perform_web_search.py +47 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/scrape_wikipedia_tables.py +33 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/transcribe_audio_file.py +21 -0
- autogen/agentchat/contrib/captainagent/tools/information_retrieval/youtube_download.py +35 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_circle_area_from_diameter.py +21 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_day_of_the_week.py +18 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_fraction_sum.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_matrix_power.py +31 -0
- autogen/agentchat/contrib/captainagent/tools/math/calculate_reflected_point.py +16 -0
- autogen/agentchat/contrib/captainagent/tools/math/complex_numbers_product.py +25 -0
- autogen/agentchat/contrib/captainagent/tools/math/compute_currency_conversion.py +23 -0
- autogen/agentchat/contrib/captainagent/tools/math/count_distinct_permutations.py +27 -0
- autogen/agentchat/contrib/captainagent/tools/math/evaluate_expression.py +28 -0
- autogen/agentchat/contrib/captainagent/tools/math/find_continuity_point.py +34 -0
- autogen/agentchat/contrib/captainagent/tools/math/fraction_to_mixed_numbers.py +39 -0
- autogen/agentchat/contrib/captainagent/tools/math/modular_inverse_sum.py +23 -0
- autogen/agentchat/contrib/captainagent/tools/math/simplify_mixed_numbers.py +36 -0
- autogen/agentchat/contrib/captainagent/tools/math/sum_of_digit_factorials.py +15 -0
- autogen/agentchat/contrib/captainagent/tools/math/sum_of_primes_below.py +15 -0
- autogen/agentchat/contrib/captainagent/tools/requirements.txt +10 -0
- autogen/agentchat/contrib/captainagent/tools/tool_description.tsv +34 -0
- autogen/agentchat/contrib/gpt_assistant_agent.py +526 -0
- autogen/agentchat/contrib/graph_rag/__init__.py +9 -0
- autogen/agentchat/contrib/graph_rag/document.py +29 -0
- autogen/agentchat/contrib/graph_rag/falkor_graph_query_engine.py +170 -0
- autogen/agentchat/contrib/graph_rag/falkor_graph_rag_capability.py +103 -0
- autogen/agentchat/contrib/graph_rag/graph_query_engine.py +53 -0
- autogen/agentchat/contrib/graph_rag/graph_rag_capability.py +63 -0
- autogen/agentchat/contrib/graph_rag/neo4j_graph_query_engine.py +268 -0
- autogen/agentchat/contrib/graph_rag/neo4j_graph_rag_capability.py +83 -0
- autogen/agentchat/contrib/graph_rag/neo4j_native_graph_query_engine.py +210 -0
- autogen/agentchat/contrib/graph_rag/neo4j_native_graph_rag_capability.py +93 -0
- autogen/agentchat/contrib/img_utils.py +397 -0
- autogen/agentchat/contrib/llamaindex_conversable_agent.py +117 -0
- autogen/agentchat/contrib/llava_agent.py +187 -0
- autogen/agentchat/contrib/math_user_proxy_agent.py +464 -0
- autogen/agentchat/contrib/multimodal_conversable_agent.py +125 -0
- autogen/agentchat/contrib/qdrant_retrieve_user_proxy_agent.py +324 -0
- autogen/agentchat/contrib/rag/__init__.py +10 -0
- autogen/agentchat/contrib/rag/chromadb_query_engine.py +272 -0
- autogen/agentchat/contrib/rag/llamaindex_query_engine.py +198 -0
- autogen/agentchat/contrib/rag/mongodb_query_engine.py +329 -0
- autogen/agentchat/contrib/rag/query_engine.py +74 -0
- autogen/agentchat/contrib/retrieve_assistant_agent.py +56 -0
- autogen/agentchat/contrib/retrieve_user_proxy_agent.py +703 -0
- autogen/agentchat/contrib/society_of_mind_agent.py +199 -0
- autogen/agentchat/contrib/swarm_agent.py +1425 -0
- autogen/agentchat/contrib/text_analyzer_agent.py +79 -0
- autogen/agentchat/contrib/vectordb/__init__.py +5 -0
- autogen/agentchat/contrib/vectordb/base.py +232 -0
- autogen/agentchat/contrib/vectordb/chromadb.py +315 -0
- autogen/agentchat/contrib/vectordb/couchbase.py +407 -0
- autogen/agentchat/contrib/vectordb/mongodb.py +550 -0
- autogen/agentchat/contrib/vectordb/pgvectordb.py +928 -0
- autogen/agentchat/contrib/vectordb/qdrant.py +320 -0
- autogen/agentchat/contrib/vectordb/utils.py +126 -0
- autogen/agentchat/contrib/web_surfer.py +303 -0
- autogen/agentchat/conversable_agent.py +4020 -0
- autogen/agentchat/group/__init__.py +64 -0
- autogen/agentchat/group/available_condition.py +91 -0
- autogen/agentchat/group/context_condition.py +77 -0
- autogen/agentchat/group/context_expression.py +238 -0
- autogen/agentchat/group/context_str.py +41 -0
- autogen/agentchat/group/context_variables.py +192 -0
- autogen/agentchat/group/group_tool_executor.py +202 -0
- autogen/agentchat/group/group_utils.py +591 -0
- autogen/agentchat/group/handoffs.py +244 -0
- autogen/agentchat/group/llm_condition.py +93 -0
- autogen/agentchat/group/multi_agent_chat.py +237 -0
- autogen/agentchat/group/on_condition.py +58 -0
- autogen/agentchat/group/on_context_condition.py +54 -0
- autogen/agentchat/group/patterns/__init__.py +18 -0
- autogen/agentchat/group/patterns/auto.py +159 -0
- autogen/agentchat/group/patterns/manual.py +176 -0
- autogen/agentchat/group/patterns/pattern.py +288 -0
- autogen/agentchat/group/patterns/random.py +106 -0
- autogen/agentchat/group/patterns/round_robin.py +117 -0
- autogen/agentchat/group/reply_result.py +26 -0
- autogen/agentchat/group/speaker_selection_result.py +41 -0
- autogen/agentchat/group/targets/__init__.py +4 -0
- autogen/agentchat/group/targets/group_chat_target.py +132 -0
- autogen/agentchat/group/targets/group_manager_target.py +151 -0
- autogen/agentchat/group/targets/transition_target.py +413 -0
- autogen/agentchat/group/targets/transition_utils.py +6 -0
- autogen/agentchat/groupchat.py +1694 -0
- autogen/agentchat/realtime/__init__.py +3 -0
- autogen/agentchat/realtime/experimental/__init__.py +20 -0
- autogen/agentchat/realtime/experimental/audio_adapters/__init__.py +8 -0
- autogen/agentchat/realtime/experimental/audio_adapters/twilio_audio_adapter.py +148 -0
- autogen/agentchat/realtime/experimental/audio_adapters/websocket_audio_adapter.py +139 -0
- autogen/agentchat/realtime/experimental/audio_observer.py +42 -0
- autogen/agentchat/realtime/experimental/clients/__init__.py +15 -0
- autogen/agentchat/realtime/experimental/clients/gemini/__init__.py +7 -0
- autogen/agentchat/realtime/experimental/clients/gemini/client.py +274 -0
- autogen/agentchat/realtime/experimental/clients/oai/__init__.py +8 -0
- autogen/agentchat/realtime/experimental/clients/oai/base_client.py +220 -0
- autogen/agentchat/realtime/experimental/clients/oai/rtc_client.py +243 -0
- autogen/agentchat/realtime/experimental/clients/oai/utils.py +48 -0
- autogen/agentchat/realtime/experimental/clients/realtime_client.py +190 -0
- autogen/agentchat/realtime/experimental/function_observer.py +85 -0
- autogen/agentchat/realtime/experimental/realtime_agent.py +158 -0
- autogen/agentchat/realtime/experimental/realtime_events.py +42 -0
- autogen/agentchat/realtime/experimental/realtime_observer.py +100 -0
- autogen/agentchat/realtime/experimental/realtime_swarm.py +475 -0
- autogen/agentchat/realtime/experimental/websockets.py +21 -0
- autogen/agentchat/realtime_agent/__init__.py +21 -0
- autogen/agentchat/user_proxy_agent.py +111 -0
- autogen/agentchat/utils.py +206 -0
- autogen/agents/__init__.py +3 -0
- autogen/agents/contrib/__init__.py +10 -0
- autogen/agents/contrib/time/__init__.py +8 -0
- autogen/agents/contrib/time/time_reply_agent.py +73 -0
- autogen/agents/contrib/time/time_tool_agent.py +51 -0
- autogen/agents/experimental/__init__.py +27 -0
- autogen/agents/experimental/deep_research/__init__.py +7 -0
- autogen/agents/experimental/deep_research/deep_research.py +52 -0
- autogen/agents/experimental/discord/__init__.py +7 -0
- autogen/agents/experimental/discord/discord.py +66 -0
- autogen/agents/experimental/document_agent/__init__.py +19 -0
- autogen/agents/experimental/document_agent/chroma_query_engine.py +316 -0
- autogen/agents/experimental/document_agent/docling_doc_ingest_agent.py +118 -0
- autogen/agents/experimental/document_agent/document_agent.py +461 -0
- autogen/agents/experimental/document_agent/document_conditions.py +50 -0
- autogen/agents/experimental/document_agent/document_utils.py +380 -0
- autogen/agents/experimental/document_agent/inmemory_query_engine.py +220 -0
- autogen/agents/experimental/document_agent/parser_utils.py +130 -0
- autogen/agents/experimental/document_agent/url_utils.py +426 -0
- autogen/agents/experimental/reasoning/__init__.py +7 -0
- autogen/agents/experimental/reasoning/reasoning_agent.py +1178 -0
- autogen/agents/experimental/slack/__init__.py +7 -0
- autogen/agents/experimental/slack/slack.py +73 -0
- autogen/agents/experimental/telegram/__init__.py +7 -0
- autogen/agents/experimental/telegram/telegram.py +77 -0
- autogen/agents/experimental/websurfer/__init__.py +7 -0
- autogen/agents/experimental/websurfer/websurfer.py +62 -0
- autogen/agents/experimental/wikipedia/__init__.py +7 -0
- autogen/agents/experimental/wikipedia/wikipedia.py +90 -0
- autogen/browser_utils.py +309 -0
- autogen/cache/__init__.py +10 -0
- autogen/cache/abstract_cache_base.py +75 -0
- autogen/cache/cache.py +203 -0
- autogen/cache/cache_factory.py +88 -0
- autogen/cache/cosmos_db_cache.py +144 -0
- autogen/cache/disk_cache.py +102 -0
- autogen/cache/in_memory_cache.py +58 -0
- autogen/cache/redis_cache.py +123 -0
- autogen/code_utils.py +596 -0
- autogen/coding/__init__.py +22 -0
- autogen/coding/base.py +119 -0
- autogen/coding/docker_commandline_code_executor.py +268 -0
- autogen/coding/factory.py +47 -0
- autogen/coding/func_with_reqs.py +202 -0
- autogen/coding/jupyter/__init__.py +23 -0
- autogen/coding/jupyter/base.py +36 -0
- autogen/coding/jupyter/docker_jupyter_server.py +167 -0
- autogen/coding/jupyter/embedded_ipython_code_executor.py +182 -0
- autogen/coding/jupyter/import_utils.py +82 -0
- autogen/coding/jupyter/jupyter_client.py +231 -0
- autogen/coding/jupyter/jupyter_code_executor.py +160 -0
- autogen/coding/jupyter/local_jupyter_server.py +172 -0
- autogen/coding/local_commandline_code_executor.py +405 -0
- autogen/coding/markdown_code_extractor.py +45 -0
- autogen/coding/utils.py +56 -0
- autogen/doc_utils.py +34 -0
- autogen/events/__init__.py +7 -0
- autogen/events/agent_events.py +1010 -0
- autogen/events/base_event.py +99 -0
- autogen/events/client_events.py +167 -0
- autogen/events/helpers.py +36 -0
- autogen/events/print_event.py +46 -0
- autogen/exception_utils.py +73 -0
- autogen/extensions/__init__.py +5 -0
- autogen/fast_depends/__init__.py +16 -0
- autogen/fast_depends/_compat.py +80 -0
- autogen/fast_depends/core/__init__.py +14 -0
- autogen/fast_depends/core/build.py +225 -0
- autogen/fast_depends/core/model.py +576 -0
- autogen/fast_depends/dependencies/__init__.py +15 -0
- autogen/fast_depends/dependencies/model.py +29 -0
- autogen/fast_depends/dependencies/provider.py +39 -0
- autogen/fast_depends/library/__init__.py +10 -0
- autogen/fast_depends/library/model.py +46 -0
- autogen/fast_depends/py.typed +6 -0
- autogen/fast_depends/schema.py +66 -0
- autogen/fast_depends/use.py +280 -0
- autogen/fast_depends/utils.py +187 -0
- autogen/formatting_utils.py +83 -0
- autogen/function_utils.py +13 -0
- autogen/graph_utils.py +178 -0
- autogen/import_utils.py +526 -0
- autogen/interop/__init__.py +22 -0
- autogen/interop/crewai/__init__.py +7 -0
- autogen/interop/crewai/crewai.py +88 -0
- autogen/interop/interoperability.py +71 -0
- autogen/interop/interoperable.py +46 -0
- autogen/interop/langchain/__init__.py +8 -0
- autogen/interop/langchain/langchain_chat_model_factory.py +155 -0
- autogen/interop/langchain/langchain_tool.py +82 -0
- autogen/interop/litellm/__init__.py +7 -0
- autogen/interop/litellm/litellm_config_factory.py +113 -0
- autogen/interop/pydantic_ai/__init__.py +7 -0
- autogen/interop/pydantic_ai/pydantic_ai.py +168 -0
- autogen/interop/registry.py +69 -0
- autogen/io/__init__.py +15 -0
- autogen/io/base.py +151 -0
- autogen/io/console.py +56 -0
- autogen/io/processors/__init__.py +12 -0
- autogen/io/processors/base.py +21 -0
- autogen/io/processors/console_event_processor.py +56 -0
- autogen/io/run_response.py +293 -0
- autogen/io/thread_io_stream.py +63 -0
- autogen/io/websockets.py +213 -0
- autogen/json_utils.py +43 -0
- autogen/llm_config.py +379 -0
- autogen/logger/__init__.py +11 -0
- autogen/logger/base_logger.py +128 -0
- autogen/logger/file_logger.py +261 -0
- autogen/logger/logger_factory.py +42 -0
- autogen/logger/logger_utils.py +57 -0
- autogen/logger/sqlite_logger.py +523 -0
- autogen/math_utils.py +339 -0
- autogen/mcp/__init__.py +7 -0
- autogen/mcp/mcp_client.py +208 -0
- autogen/messages/__init__.py +7 -0
- autogen/messages/agent_messages.py +948 -0
- autogen/messages/base_message.py +107 -0
- autogen/messages/client_messages.py +171 -0
- autogen/messages/print_message.py +49 -0
- autogen/oai/__init__.py +53 -0
- autogen/oai/anthropic.py +714 -0
- autogen/oai/bedrock.py +628 -0
- autogen/oai/cerebras.py +299 -0
- autogen/oai/client.py +1435 -0
- autogen/oai/client_utils.py +169 -0
- autogen/oai/cohere.py +479 -0
- autogen/oai/gemini.py +990 -0
- autogen/oai/gemini_types.py +129 -0
- autogen/oai/groq.py +305 -0
- autogen/oai/mistral.py +303 -0
- autogen/oai/oai_models/__init__.py +11 -0
- autogen/oai/oai_models/_models.py +16 -0
- autogen/oai/oai_models/chat_completion.py +87 -0
- autogen/oai/oai_models/chat_completion_audio.py +32 -0
- autogen/oai/oai_models/chat_completion_message.py +86 -0
- autogen/oai/oai_models/chat_completion_message_tool_call.py +37 -0
- autogen/oai/oai_models/chat_completion_token_logprob.py +63 -0
- autogen/oai/oai_models/completion_usage.py +60 -0
- autogen/oai/ollama.py +643 -0
- autogen/oai/openai_utils.py +881 -0
- autogen/oai/together.py +370 -0
- autogen/retrieve_utils.py +491 -0
- autogen/runtime_logging.py +160 -0
- autogen/token_count_utils.py +267 -0
- autogen/tools/__init__.py +20 -0
- autogen/tools/contrib/__init__.py +9 -0
- autogen/tools/contrib/time/__init__.py +7 -0
- autogen/tools/contrib/time/time.py +41 -0
- autogen/tools/dependency_injection.py +254 -0
- autogen/tools/experimental/__init__.py +43 -0
- autogen/tools/experimental/browser_use/__init__.py +7 -0
- autogen/tools/experimental/browser_use/browser_use.py +161 -0
- autogen/tools/experimental/crawl4ai/__init__.py +7 -0
- autogen/tools/experimental/crawl4ai/crawl4ai.py +153 -0
- autogen/tools/experimental/deep_research/__init__.py +7 -0
- autogen/tools/experimental/deep_research/deep_research.py +328 -0
- autogen/tools/experimental/duckduckgo/__init__.py +7 -0
- autogen/tools/experimental/duckduckgo/duckduckgo_search.py +109 -0
- autogen/tools/experimental/google/__init__.py +14 -0
- autogen/tools/experimental/google/authentication/__init__.py +11 -0
- autogen/tools/experimental/google/authentication/credentials_hosted_provider.py +43 -0
- autogen/tools/experimental/google/authentication/credentials_local_provider.py +91 -0
- autogen/tools/experimental/google/authentication/credentials_provider.py +35 -0
- autogen/tools/experimental/google/drive/__init__.py +9 -0
- autogen/tools/experimental/google/drive/drive_functions.py +124 -0
- autogen/tools/experimental/google/drive/toolkit.py +88 -0
- autogen/tools/experimental/google/model.py +17 -0
- autogen/tools/experimental/google/toolkit_protocol.py +19 -0
- autogen/tools/experimental/google_search/__init__.py +8 -0
- autogen/tools/experimental/google_search/google_search.py +93 -0
- autogen/tools/experimental/google_search/youtube_search.py +181 -0
- autogen/tools/experimental/messageplatform/__init__.py +17 -0
- autogen/tools/experimental/messageplatform/discord/__init__.py +7 -0
- autogen/tools/experimental/messageplatform/discord/discord.py +288 -0
- autogen/tools/experimental/messageplatform/slack/__init__.py +7 -0
- autogen/tools/experimental/messageplatform/slack/slack.py +391 -0
- autogen/tools/experimental/messageplatform/telegram/__init__.py +7 -0
- autogen/tools/experimental/messageplatform/telegram/telegram.py +275 -0
- autogen/tools/experimental/perplexity/__init__.py +7 -0
- autogen/tools/experimental/perplexity/perplexity_search.py +260 -0
- autogen/tools/experimental/tavily/__init__.py +7 -0
- autogen/tools/experimental/tavily/tavily_search.py +183 -0
- autogen/tools/experimental/web_search_preview/__init__.py +7 -0
- autogen/tools/experimental/web_search_preview/web_search_preview.py +114 -0
- autogen/tools/experimental/wikipedia/__init__.py +7 -0
- autogen/tools/experimental/wikipedia/wikipedia.py +287 -0
- autogen/tools/function_utils.py +411 -0
- autogen/tools/tool.py +187 -0
- autogen/tools/toolkit.py +86 -0
- autogen/types.py +29 -0
- autogen/version.py +7 -0
- ag2-0.9.1.dist-info/RECORD +0 -6
- ag2-0.9.1.dist-info/top_level.txt +0 -1
- {ag2-0.9.1.dist-info → ag2-0.9.1.post0.dist-info/licenses}/LICENSE +0 -0
- {ag2-0.9.1.dist-info → ag2-0.9.1.post0.dist-info/licenses}/NOTICE.md +0 -0
autogen/code_utils.py
ADDED
|
@@ -0,0 +1,596 @@
|
|
|
1
|
+
# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors
|
|
2
|
+
#
|
|
3
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
4
|
+
#
|
|
5
|
+
# Portions derived from https://github.com/microsoft/autogen are under the MIT License.
|
|
6
|
+
# SPDX-License-Identifier: MIT
|
|
7
|
+
import logging
|
|
8
|
+
import os
|
|
9
|
+
import pathlib
|
|
10
|
+
import re
|
|
11
|
+
import string
|
|
12
|
+
import subprocess
|
|
13
|
+
import sys
|
|
14
|
+
import time
|
|
15
|
+
import venv
|
|
16
|
+
from concurrent.futures import ThreadPoolExecutor, TimeoutError
|
|
17
|
+
from hashlib import md5
|
|
18
|
+
from types import SimpleNamespace
|
|
19
|
+
from typing import Callable, Optional, Union
|
|
20
|
+
|
|
21
|
+
import docker
|
|
22
|
+
|
|
23
|
+
from .types import UserMessageImageContentPart, UserMessageTextContentPart
|
|
24
|
+
|
|
25
|
+
# Unique default marker; `execute_code` uses it as the default value of `use_docker`.
SENTINEL = object()
DEFAULT_MODEL = "gpt-4"
FAST_MODEL = "gpt-3.5-turbo"
# Regular expression for finding a fenced code block:
#   ```[ \t]*(\w+)?[ \t]*\r?\n(.*?)\r?\n[ \t]*```
# Read left to right:
#   ```      opening fence.
#   [ \t]*   optional spaces/tabs before the language name.
#   (\w+)?   the language name; the trailing ? makes it optional.
#   [ \t]*   optional spaces/tabs (never newlines) after the language name.
#   \r?\n    a line break is required after the opening fence line.
#   (.*?)    the code itself, non-greedy (spans lines only under re.DOTALL).
#   \r?\n    a line break is required before the closing fence.
#   [ \t]*   optional indentation in front of the closing fence (the spec allows it).
#   ```      closing fence.
CODE_BLOCK_PATTERN = r"```[ \t]*(\w+)?[ \t]*\r?\n(.*?)\r?\n[ \t]*```"
WORKING_DIR = os.path.join(os.path.dirname(os.path.realpath(__file__)), "extensions")
UNKNOWN = "unknown"
TIMEOUT_MSG = "Timeout"
DEFAULT_TIMEOUT = 600
WIN32 = sys.platform == "win32"
PATH_SEPARATOR = "\\" if WIN32 else "/"
PYTHON_VARIANTS = ["python", "Python", "py"]

logger = logging.getLogger(__name__)
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
def content_str(content: Union[str, list[Union[UserMessageTextContentPart, UserMessageImageContentPart]], None]) -> str:
    """Flatten the `content` field of an OpenAI-style message into one string.

    `None` becomes the empty string and a plain string is returned untouched.
    A list is walked in order: every "text" part contributes its text and
    every "image_url" part contributes the literal placeholder `<image>`.

    Args:
        content: `None`, a string, or a list of dicts. Each dict must carry a
            "type" key whose value is either "text" or "image_url"; "text"
            parts must also carry a "text" key.

    Returns:
        str: The concatenated text, with one `<image>` token per image part.

    Raises:
        TypeError: If `content` is not `None`, a string or a list, or if a
            list element is not a dict.
        AssertionError: If a list element has no "type" key.
        ValueError: If a "type" value is neither "text" nor "image_url".
    """
    if content is None:
        return ""
    if isinstance(content, str):
        return content
    if not isinstance(content, list):
        raise TypeError(f"content must be None, str, or list, but got {type(content)}")

    flattened = ""
    for part in content:
        if not isinstance(part, dict):
            raise TypeError("Wrong content format: every element should be dict if the content is a list.")
        assert "type" in part, "Wrong content format. Missing 'type' key in content's dict."

        kind = part["type"]
        if kind == "text":
            flattened += part["text"]
            continue
        if kind == "image_url":
            # The image payload itself is dropped; only a marker is kept.
            flattened += "<image>"
            continue
        raise ValueError(f"Wrong content format: unknown type {kind} within the content")
    return flattened
|
|
87
|
+
|
|
88
|
+
|
|
89
|
+
def infer_lang(code: str) -> str:
    """Guess the language of a code snippet.

    The heuristic is deliberately simple (TODO: make it robust):
    text starting with `python `, `python3 ` or `pip` is treated as a shell
    command; anything else that compiles as Python is reported as Python.

    Args:
        code: The snippet to classify.

    Returns:
        str: "sh", "python", or the module-level `UNKNOWN` marker when the
        snippet is not syntactically valid Python.
    """
    shell_prefixes = ("python ", "pip", "python3 ")
    if code.startswith(shell_prefixes):
        return "sh"

    # Compiling is used purely as a syntax check; the code is never executed.
    try:
        compile(code, "test", "exec")
    except SyntaxError:
        return UNKNOWN
    return "python"
|
|
103
|
+
|
|
104
|
+
|
|
105
|
+
# TODO: In the future move, to better support https://spec.commonmark.org/0.30/#fenced-code-blocks
|
|
106
|
+
# perhaps by using a full Markdown parser.
|
|
107
|
+
def extract_code(
    text: Union[str, list], pattern: str = CODE_BLOCK_PATTERN, detect_single_line_code: bool = False
) -> list[tuple[str, str]]:
    """Extract code from a text.

    Args:
        text (str or List): The content to extract code from. The content can be
            a string or a list, as returned by standard GPT or multimodal GPT.
            It is first flattened with `content_str`.
        pattern (str, optional): The regular expression pattern for finding the
            code block. Defaults to CODE_BLOCK_PATTERN. Only used when
            `detect_single_line_code` is False; the single-line mode always
            builds its pattern from CODE_BLOCK_PATTERN because it relies on
            that pattern's two capture groups.
        detect_single_line_code (bool, optional): Enable the new feature for
            extracting single line code. Defaults to False.

    Returns:
        list: A list of tuples, each containing the language and the code.
          If there is no code block in the input text, the language would be "unknown"
          (with `detect_single_line_code=True` an empty list is returned instead).
          If there is code block but the language is not specified, the language would be "".
    """
    text = content_str(text)
    if not detect_single_line_code:
        match = re.findall(pattern, text, flags=re.DOTALL)
        return match if match else [(UNKNOWN, text)]

    # Extract both multi-line and single-line code block, separated by the | operator
    # `([^`]+)`: Matches inline code.
    # re.DOTALL is required so that `(.*?)` in the fenced alternative can span
    # several lines; without it a fenced block with more than one line of code
    # falls through to the inline alternative and is returned mangled.
    code_pattern = re.compile(CODE_BLOCK_PATTERN + r"|`([^`]+)`", flags=re.DOTALL)
    code_blocks = code_pattern.findall(text)

    # Each match is (language, fenced_code, inline_code); exactly one of the
    # two code groups is non-empty depending on which alternative matched.
    extracted = []
    for lang, fenced_code, inline_code in code_blocks:
        if fenced_code:
            extracted.append((lang.strip(), fenced_code.strip()))
        elif inline_code:
            extracted.append(("", inline_code.strip()))

    return extracted
|
|
144
|
+
|
|
145
|
+
|
|
146
|
+
def timeout_handler(signum, frame):
    """Abort the current operation by raising `TimeoutError`.

    The two parameters mirror what a `signal.signal` handler receives and are
    ignored. NOTE(review): presumably installed as an alarm handler elsewhere
    in the file; the registration is not visible here.

    Raises:
        TimeoutError: Always, with the message "Timed out!".
    """
    message = "Timed out!"
    raise TimeoutError(message)
|
|
148
|
+
|
|
149
|
+
|
|
150
|
+
def get_powershell_command():
    """Find out which PowerShell executable is usable on this machine.

    `powershell` is probed first. `pwsh` is probed only when launching
    `powershell` fails because the executable cannot be found.

    Returns:
        "powershell" or "pwsh" for the first probe that exits with status 0.
        If a probe starts but exits with a non-zero status, no further probe
        is attempted and `None` is returned implicitly.

    Raises:
        FileNotFoundError: If neither `powershell` nor `pwsh` can be found.
        NotADirectoryError: If launching `pwsh` fails because a path component
            is not a directory (typically a malformed PATH entry).
        PermissionError: If `powershell` exists but may not be executed.
    """
    try:
        result = subprocess.run(["powershell", "$PSVersionTable.PSVersion.Major"], capture_output=True, text=True)
        if result.returncode == 0:
            return "powershell"
    except (FileNotFoundError, NotADirectoryError):
        # This means that 'powershell' command is not found so now we try looking for 'pwsh'
        try:
            result = subprocess.run(
                ["pwsh", "-Command", "$PSVersionTable.PSVersion.Major"], capture_output=True, text=True
            )
            if result.returncode == 0:
                return "pwsh"
        # A missing executable surfaces as FileNotFoundError. FileExistsError
        # (what this handler used to catch exclusively) is kept only so that
        # anything previously translated is still translated.
        except (FileNotFoundError, FileExistsError) as e:
            raise FileNotFoundError(
                "Neither powershell.exe nor pwsh.exe is present in the system. "
                "Please install PowerShell and try again. "
            ) from e
        except NotADirectoryError as e:
            raise NotADirectoryError(
                "PowerShell is either not installed or its path is not given "
                "properly in the environment variable PATH. Please check the "
                "path and try again. "
            ) from e
    except PermissionError as e:
        raise PermissionError("No permission to run powershell.") from e
|
|
176
|
+
|
|
177
|
+
|
|
178
|
+
def _cmd(lang: str) -> str:
    """Translate a code-block language tag into the command used to run it.

    Args:
        lang: The language tag, e.g. "python", "sh", "javascript", "ps1".

    Returns:
        str: "python" for any tag in `PYTHON_VARIANTS`; the tag itself for
        other tags starting with "python" and for "bash"/"sh"; "sh" for
        "shell"; "node" for "javascript"; and whatever
        `get_powershell_command()` returns for "ps1"/"pwsh"/"powershell".

    Raises:
        NotImplementedError: If the tag is none of the above.
    """
    if lang in PYTHON_VARIANTS:
        return "python"
    if lang.startswith("python") or lang in ["bash", "sh"]:
        # These tags are already valid executable names.
        return lang

    fixed_aliases = {"shell": "sh", "javascript": "node"}
    if lang in fixed_aliases:
        return fixed_aliases[lang]

    if lang in ["ps1", "pwsh", "powershell"]:
        # Which PowerShell binary exists has to be probed at call time.
        return get_powershell_command()

    raise NotImplementedError(f"{lang} not recognized in code execution")
|
|
192
|
+
|
|
193
|
+
|
|
194
|
+
def is_docker_running() -> bool:
    """Report whether a Docker daemon can be reached.

    A client is built from the environment and pinged; any
    `docker.errors.DockerException` raised along the way counts as
    "not running".

    Returns:
        bool: True if docker is running; False otherwise.
    """
    try:
        docker.from_env().ping()
    except docker.errors.DockerException:
        return False
    return True
|
|
206
|
+
|
|
207
|
+
|
|
208
|
+
def in_docker_container() -> bool:
    """Report whether this process appears to run inside a Docker container.

    The check is simply whether the path `/.dockerenv` exists.

    Returns:
        bool: True if the code is running in a docker container; False otherwise.
    """
    marker_file = "/.dockerenv"
    return os.path.exists(marker_file)
|
|
215
|
+
|
|
216
|
+
|
|
217
|
+
def decide_use_docker(use_docker: Optional[bool]) -> Optional[bool]:
    """Resolve the effective `use_docker` setting.

    An explicit (non-None) argument always wins and is returned unchanged.
    Otherwise the AUTOGEN_USE_DOCKER environment variable is consulted,
    case-insensitively, defaulting to "True" when it is unset.

    Args:
        use_docker: The caller's explicit choice, or None to defer to the
            environment.

    Returns:
        Optional[bool]: True for "1"/"true"/"yes"/"t", False for
        "0"/"false"/"no"/"f", and None for the literal string "none".

    Raises:
        ValueError: If the environment variable holds any other value.
    """
    if use_docker is not None:
        return use_docker

    raw_setting = os.environ.get("AUTOGEN_USE_DOCKER", "True")
    # Lower-case once so every comparison below is case-insensitive.
    normalized = raw_setting.lower()

    if normalized in {"1", "true", "yes", "t"}:
        return True
    if normalized in {"0", "false", "no", "f"}:
        return False
    if normalized == "none":  # Special case for 'None' as a string
        return None

    # Anything else is a configuration mistake; report the value as typed.
    raise ValueError(
        f'Invalid value for AUTOGEN_USE_DOCKER: {raw_setting}. Please set AUTOGEN_USE_DOCKER to "1/True/yes", "0/False/no", or "None".'
    )
|
|
240
|
+
|
|
241
|
+
|
|
242
|
+
def check_can_use_docker_or_throw(use_docker) -> None:
    """Raise if docker execution is requested but docker cannot be used.

    Nothing is checked when `use_docker` is None, False or otherwise falsy, so
    the docker daemon is only probed when docker execution was actually
    requested.

    Args:
        use_docker: The resolved docker setting (None, a bool, or an image
            name / list of image names).

    Raises:
        RuntimeError: If `use_docker` is truthy, the code is not running inside
            a docker container, and docker is not running.
    """
    # Docker was not requested: skip the (potentially slow) daemon probe.
    if not use_docker:
        return
    # No daemon is required when already inside a container.
    if in_docker_container():
        return
    if is_docker_running():
        return
    raise RuntimeError(
        "Code execution is set to be run in docker (default behaviour) but docker is not running.\n"
        "The options available are:\n"
        "- Make sure docker is running (advised approach for code execution)\n"
        '- Set "use_docker": False in code_execution_config\n'
        '- Set AUTOGEN_USE_DOCKER to "0/False/no" in your environment variables'
    )
|
|
254
|
+
|
|
255
|
+
|
|
256
|
+
def _sanitize_filename_for_docker_tag(filename: str) -> str:
|
|
257
|
+
"""Convert a filename to a valid docker tag.
|
|
258
|
+
See https://docs.docker.com/engine/reference/commandline/tag/ for valid tag
|
|
259
|
+
format.
|
|
260
|
+
|
|
261
|
+
Args:
|
|
262
|
+
filename (str): The filename to be converted.
|
|
263
|
+
|
|
264
|
+
Returns:
|
|
265
|
+
str: The sanitized Docker tag.
|
|
266
|
+
"""
|
|
267
|
+
# Replace any character not allowed with an underscore
|
|
268
|
+
allowed_chars = set(string.ascii_letters + string.digits + "_.-")
|
|
269
|
+
sanitized = "".join(char if char in allowed_chars else "_" for char in filename)
|
|
270
|
+
|
|
271
|
+
# Ensure it does not start with a period or a dash
|
|
272
|
+
if sanitized.startswith(".") or sanitized.startswith("-"):
|
|
273
|
+
sanitized = "_" + sanitized[1:]
|
|
274
|
+
|
|
275
|
+
# Truncate if longer than 128 characters
|
|
276
|
+
return sanitized[:128]
|
|
277
|
+
|
|
278
|
+
|
|
279
|
+
def execute_code(
    code: Optional[str] = None,
    timeout: Optional[int] = None,
    filename: Optional[str] = None,
    work_dir: Optional[str] = None,
    use_docker: Union[list[str], str, bool] = SENTINEL,
    lang: Optional[str] = "python",
) -> tuple[int, str, Optional[str]]:
    """Execute code in a docker container or in the current environment.

    This function is not tested on MacOS.

    Args:
        code (Optional, str): The code to execute.
            If None, the code from the file specified by filename will be executed.
            Either code or filename must be provided.
        timeout (Optional, int): The maximum execution time in seconds.
            If None, a default timeout will be used. The default timeout is 600 seconds. On Windows, the timeout is not enforced when use_docker=False.
        filename (Optional, str): The file name to save the code or where the code is stored when `code` is None.
            If None, a file with a randomly generated name will be created.
            The randomly generated file will be deleted after execution.
            The file name must be a relative path. Relative paths are relative to the working directory.
        work_dir (Optional, str): The working directory for the code execution.
            If None, a default working directory will be used.
            The default working directory is the "extensions" directory under
            "path_to_autogen".
        use_docker (list, str or bool): The docker image to use for code execution.
            When not set, the value is resolved by `decide_use_docker` from the
            AUTOGEN_USE_DOCKER environment variable, which is treated as True when unset.
            With True, the code will be executed in a docker container and a default list of images will be used.
            If a list or a str of image name(s) is provided, the code will be executed in a docker container
            with the first image successfully pulled.
            If False, the code will be executed in the current environment.
            Expected behaviour:
                - If `use_docker` resolves to True and docker is running, the code will run in a Docker container.
                - If `use_docker` resolves to True but the Docker package is missing or docker isn't running, an error will be raised.
                - If `use_docker` is explicitly set to False, the code will run natively.
            If the code is executed in the current environment,
            the code must be trusted.
        lang (Optional, str): The language of the code. Default is "python".

    Returns:
        int: 0 if the code executes successfully.
        str: The error message if the code fails to execute; the stdout otherwise.
        image: The docker image name after container run when docker is used.

    Raises:
        AssertionError: If neither `code` nor `filename` is provided.
        RuntimeError: If docker execution is requested but docker is not running.
    """
    if all((code is None, filename is None)):
        error_msg = f"Either {code=} or {filename=} must be provided."
        logger.error(error_msg)
        raise AssertionError(error_msg)

    running_inside_docker = in_docker_container()
    docker_running = is_docker_running()

    # SENTINEL is used to indicate that the user did not explicitly set the argument
    if use_docker is SENTINEL:
        use_docker = decide_use_docker(use_docker=None)
    check_can_use_docker_or_throw(use_docker)

    timeout = timeout or DEFAULT_TIMEOUT
    # Remember whether the caller named the file: only auto-named files are deleted afterwards.
    original_filename = filename
    if WIN32 and lang in ["sh", "shell"] and (not use_docker):
        lang = "ps1"
    if filename is None:
        code_hash = md5(code.encode()).hexdigest()
        # create a file with a automatically generated name
        filename = f"tmp_code_{code_hash}.{'py' if lang.startswith('python') else lang}"
    if work_dir is None:
        work_dir = WORKING_DIR

    filepath = os.path.join(work_dir, filename)
    file_dir = os.path.dirname(filepath)
    os.makedirs(file_dir, exist_ok=True)

    if code is not None:
        with open(filepath, "w", encoding="utf-8") as fout:
            fout.write(code)

    if not use_docker or running_inside_docker:
        # Run natively: docker was not requested, or we are already running in a docker container
        cmd = [
            sys.executable if lang.startswith("python") else _cmd(lang),
            f".\\{filename}" if WIN32 else filename,
        ]
        with ThreadPoolExecutor(max_workers=1) as executor:
            future = executor.submit(
                subprocess.run,
                cmd,
                cwd=work_dir,
                capture_output=True,
                text=True,
            )
            try:
                result = future.result(timeout=timeout)
            except TimeoutError:
                # NOTE(review): leaving the `with` block waits for the worker thread,
                # so the timed-out subprocess is not terminated here.
                if original_filename is None:
                    os.remove(filepath)
                return 1, TIMEOUT_MSG, None
        if original_filename is None:
            os.remove(filepath)
        if result.returncode:
            logs = result.stderr
            # Strip local paths from the error output.
            if original_filename is None:
                abs_path = str(pathlib.Path(filepath).absolute())
                logs = logs.replace(str(abs_path), "").replace(filename, "")
            else:
                abs_path = str(pathlib.Path(work_dir).absolute()) + PATH_SEPARATOR
                logs = logs.replace(str(abs_path), "")
        else:
            logs = result.stdout
        return result.returncode, logs, None

    # create a docker client
    if use_docker and not docker_running:
        raise RuntimeError(
            "Docker package is missing or docker is not running. Please make sure docker is running or set use_docker=False."
        )

    client = docker.from_env()

    image_list = (
        ["python:3-slim", "python:3", "python:3-windowsservercore"]
        if use_docker is True
        else [use_docker]
        if isinstance(use_docker, str)
        else use_docker
    )
    for image in image_list:
        # check if the image exists
        try:
            client.images.get(image)
            break
        except docker.errors.ImageNotFound:
            # pull the image
            print("Pulling image", image)
            try:
                client.images.pull(image)
                break
            except docker.errors.DockerException:
                print("Failed to pull image", image)
    # get a randomized str based on current time to wrap the exit code
    exit_code_str = f"exitcode{time.time()}"
    abs_path = pathlib.Path(work_dir).absolute()
    cmd = [
        "sh",
        "-c",
        f'{_cmd(lang)} "{filename}"; exit_code=$?; echo -n {exit_code_str}; echo -n $exit_code; echo {exit_code_str}',
    ]
    # create a docker container
    container = client.containers.run(
        image,
        command=cmd,
        working_dir="/workspace",
        detach=True,
        # get absolute path to the working directory
        volumes={abs_path: {"bind": "/workspace", "mode": "rw"}},
    )
    start_time = time.time()
    while container.status != "exited" and time.time() - start_time < timeout:
        # Reload the container object
        container.reload()
    if container.status != "exited":
        # Timed out: stop and discard the container.
        container.stop()
        container.remove()
        if original_filename is None:
            os.remove(filepath)
        return 1, TIMEOUT_MSG, image
    # get the container logs
    logs = container.logs().decode("utf-8").rstrip()
    # commit the image
    tag = _sanitize_filename_for_docker_tag(filename)
    container.commit(repository="python", tag=tag)
    # remove the container
    container.remove()
    # check if the code executed successfully
    exit_code = container.attrs["State"]["ExitCode"]
    if exit_code == 0:
        # extract the exit code from the logs; the marker contains a "." (from the
        # timestamp), so it is escaped to be matched literally
        marker = re.escape(exit_code_str)
        pattern = re.compile(f"{marker}(\\d+){marker}")
        match = pattern.search(logs)
        exit_code = 1 if match is None else int(match.group(1))
        # remove the exit code from the logs
        logs = logs if match is None else pattern.sub("", logs)

    if original_filename is None:
        os.remove(filepath)
    if exit_code:
        logs = logs.replace(f"/workspace/{filename if original_filename is None else ''}", "")
    # return the exit code, logs and image
    return exit_code, logs, f"python:{tag}"
|
|
466
|
+
|
|
467
|
+
|
|
468
|
+
# Completion settings for generating assertions from a function signature and docstring.
# `{definition}` in the prompt is a template placeholder (presumably filled with the
# function definition by the consumer of this config). Generation is capped at
# 256 tokens and stops at the first blank line ("\n\n").
_GENERATE_ASSERTIONS_CONFIG = {
    "prompt": """Given the signature and docstring, write the exactly same number of assertion(s) for the provided example(s) in the docstring, without assertion messages.

func signature:
{definition}
assertions:""",
    "model": FAST_MODEL,
    "max_tokens": 256,
    "stop": "\n\n",
}
|
|
478
|
+
|
|
479
|
+
|
|
480
|
+
def _remove_check(response):
|
|
481
|
+
"""Remove the check function from the response."""
|
|
482
|
+
# find the position of the check function
|
|
483
|
+
pos = response.find("def check(")
|
|
484
|
+
if pos == -1:
|
|
485
|
+
return response
|
|
486
|
+
return response[:pos]
|
|
487
|
+
|
|
488
|
+
|
|
489
|
+
def eval_function_completions(
    responses: list[str],
    definition: str,
    test: Optional[str] = None,
    entry_point: Optional[str] = None,
    assertions: Optional[Union[str, Callable[[str], tuple[str, float]]]] = None,
    timeout: Optional[float] = 3,
    use_docker: Optional[bool] = True,
) -> dict:
    """`(openai<1)` Select a response from a list of responses for the function completion task (using generated assertions), and/or evaluate if the task is successful using a gold test.

    Args:
        responses: The list of responses. Must not be empty. When `assertions` is
            provided, entries are replaced in place by their text with any
            trailing `def check(` section removed.
        definition: The input definition.
        test: The test code.
        entry_point: The name of the function.
        assertions: The assertion code which serves as a filter of the responses, or an assertion generator.
            When provided, only the responses that pass the assertions will be considered for the actual test (if provided).
            A generator is only invoked when there is more than one response.
        timeout: The timeout for executing the code.
        use_docker: Whether to use docker for code execution.

    Returns:
        dict: The success metrics. Without `assertions`: `expected_success` and
            `success`. With `assertions`: `index_selected`, `succeed_assertions`,
            `gen_cost`, `assertions`, plus `success` when `test` is given.

    Raises:
        ValueError: If `responses` is empty.
    """
    n = len(responses)
    if n == 0:
        # Every path below needs at least one response (division by n, responses[0]).
        raise ValueError("responses must contain at least one response.")

    def _program(response: str, suffix: str) -> str:
        # A response starting with `def` is used as is; otherwise it is
        # appended to the given definition.
        head = response if response.startswith("def") else f"{definition}{response}"
        return f"{head}\n{suffix}"

    if assertions is None:
        # no assertion filter
        success_list = []
        for raw_response in responses:
            response = _remove_check(raw_response)
            code = _program(response, f"{test}\ncheck({entry_point})")
            success = execute_code(code, timeout=timeout, use_docker=use_docker)[0] == 0
            success_list.append(success)
        return {
            "expected_success": 1 - pow(1 - sum(success_list) / n, n),
            "success": any(success_list),
        }
    if callable(assertions) and n > 1:
        # assertion generator
        assertions, gen_cost = assertions(definition)
    elif isinstance(assertions, str):
        # assertion code given directly: keep it as the filter; nothing was generated
        gen_cost = 0
    else:
        # a generator with a single response: nothing to choose between, skip generation
        assertions, gen_cost = None, 0
    if n > 1 or test is None:
        # select the first response passing the assertions; if none passes,
        # the loop ends with the last response selected
        for i in range(n):
            response = responses[i] = _remove_check(responses[i])
            code = _program(response, f"{assertions}")
            succeed_assertions = execute_code(code, timeout=timeout, use_docker=use_docker)[0] == 0
            if succeed_assertions:
                break
    else:
        # just test, no need to check assertions
        succeed_assertions = False
        i, response = 0, responses[0]
    if test is None:
        # no test code
        return {
            "index_selected": i,
            "succeed_assertions": succeed_assertions,
            "gen_cost": gen_cost,
            "assertions": assertions,
        }
    code_test = _program(response, f"{test}\ncheck({entry_point})")
    success = execute_code(code_test, timeout=timeout, use_docker=use_docker)[0] == 0
    return {
        "index_selected": i,
        "succeed_assertions": succeed_assertions,
        "success": success,
        "gen_cost": gen_cost,
        "assertions": assertions,
    }
|
|
569
|
+
|
|
570
|
+
|
|
571
|
+
# Prompt template for function completion; `{definition}` is a template placeholder.
_FUNC_COMPLETION_PROMPT = "# Python 3{definition}"
# Stop sequences: generation ends where a new line begins with class/def/if/print.
_FUNC_COMPLETION_STOP = ["\nclass", "\ndef", "\nif", "\nprint"]
# Completion configurations for implementing a function: FAST_MODEL entries first,
# then DEFAULT_MODEL entries, with differing `n`, `temperature` and `cache_seed`.
# NOTE(review): presumably tried in order by the consumer — confirm against the caller.
_IMPLEMENT_CONFIGS = [
    {"model": FAST_MODEL, "prompt": _FUNC_COMPLETION_PROMPT, "temperature": 0, "cache_seed": 0},
    {"model": FAST_MODEL, "prompt": _FUNC_COMPLETION_PROMPT, "stop": _FUNC_COMPLETION_STOP, "n": 7, "cache_seed": 0},
    {"model": DEFAULT_MODEL, "prompt": _FUNC_COMPLETION_PROMPT, "temperature": 0, "cache_seed": 1},
    {"model": DEFAULT_MODEL, "prompt": _FUNC_COMPLETION_PROMPT, "stop": _FUNC_COMPLETION_STOP, "n": 2, "cache_seed": 2},
    {"model": DEFAULT_MODEL, "prompt": _FUNC_COMPLETION_PROMPT, "stop": _FUNC_COMPLETION_STOP, "n": 1, "cache_seed": 2},
]
|
|
580
|
+
|
|
581
|
+
|
|
582
|
+
def create_virtual_env(dir_path: str, **env_args) -> SimpleNamespace:
    """Build a python virtual environment and hand back its context.

    Args:
        dir_path (str): Directory path where the env will be created.
        **env_args: Any extra args to pass to the `EnvBuilder`. When none are
            given, the builder is created with `with_pip=True`.

    Returns:
        SimpleNamespace: the virtual env context object.
    """
    builder_options = env_args if env_args else {"with_pip": True}
    builder = venv.EnvBuilder(**builder_options)
    builder.create(dir_path)
    context = builder.ensure_directories(dir_path)
    return context
|
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
# Copyright (c) 2023 - 2025, AG2ai, Inc., AG2ai open-source projects maintainers and core contributors
|
|
2
|
+
#
|
|
3
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
4
|
+
#
|
|
5
|
+
# Original portions of this file are derived from https://github.com/microsoft/autogen under the MIT License.
|
|
6
|
+
# SPDX-License-Identifier: MIT
|
|
7
|
+
from .base import CodeBlock, CodeExecutor, CodeExtractor, CodeResult
|
|
8
|
+
from .docker_commandline_code_executor import DockerCommandLineCodeExecutor
|
|
9
|
+
from .factory import CodeExecutorFactory
|
|
10
|
+
from .local_commandline_code_executor import LocalCommandLineCodeExecutor
|
|
11
|
+
from .markdown_code_extractor import MarkdownCodeExtractor
|
|
12
|
+
|
|
13
|
+
# Public names of this package, re-exported from its submodules.
__all__ = (
    "CodeBlock",
    "CodeExecutor",
    "CodeExecutorFactory",
    "CodeExtractor",
    "CodeResult",
    "DockerCommandLineCodeExecutor",
    "LocalCommandLineCodeExecutor",
    "MarkdownCodeExtractor",
)
|