autobyteus 1.2.1__py3-none-any.whl → 1.2.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (466)
  1. autobyteus/agent/agent.py +15 -5
  2. autobyteus/agent/bootstrap_steps/__init__.py +1 -3
  3. autobyteus/agent/bootstrap_steps/agent_bootstrapper.py +3 -59
  4. autobyteus/agent/bootstrap_steps/base_bootstrap_step.py +1 -4
  5. autobyteus/agent/bootstrap_steps/mcp_server_prewarming_step.py +1 -3
  6. autobyteus/agent/bootstrap_steps/system_prompt_processing_step.py +16 -13
  7. autobyteus/agent/bootstrap_steps/workspace_context_initialization_step.py +2 -4
  8. autobyteus/agent/context/agent_config.py +43 -20
  9. autobyteus/agent/context/agent_context.py +23 -18
  10. autobyteus/agent/context/agent_runtime_state.py +19 -19
  11. autobyteus/agent/events/__init__.py +16 -1
  12. autobyteus/agent/events/agent_events.py +43 -3
  13. autobyteus/agent/events/agent_input_event_queue_manager.py +79 -26
  14. autobyteus/agent/events/event_store.py +57 -0
  15. autobyteus/agent/events/notifiers.py +69 -59
  16. autobyteus/agent/events/worker_event_dispatcher.py +21 -64
  17. autobyteus/agent/factory/agent_factory.py +52 -0
  18. autobyteus/agent/handlers/__init__.py +2 -0
  19. autobyteus/agent/handlers/approved_tool_invocation_event_handler.py +51 -34
  20. autobyteus/agent/handlers/bootstrap_event_handler.py +155 -0
  21. autobyteus/agent/handlers/inter_agent_message_event_handler.py +10 -0
  22. autobyteus/agent/handlers/lifecycle_event_logger.py +19 -11
  23. autobyteus/agent/handlers/llm_complete_response_received_event_handler.py +10 -15
  24. autobyteus/agent/handlers/llm_user_message_ready_event_handler.py +188 -48
  25. autobyteus/agent/handlers/tool_execution_approval_event_handler.py +0 -10
  26. autobyteus/agent/handlers/tool_invocation_request_event_handler.py +53 -48
  27. autobyteus/agent/handlers/tool_result_event_handler.py +7 -8
  28. autobyteus/agent/handlers/user_input_message_event_handler.py +10 -3
  29. autobyteus/agent/input_processor/memory_ingest_input_processor.py +40 -0
  30. autobyteus/agent/lifecycle/__init__.py +12 -0
  31. autobyteus/agent/lifecycle/base_processor.py +109 -0
  32. autobyteus/agent/lifecycle/events.py +35 -0
  33. autobyteus/agent/lifecycle/processor_definition.py +36 -0
  34. autobyteus/agent/lifecycle/processor_registry.py +106 -0
  35. autobyteus/agent/llm_request_assembler.py +98 -0
  36. autobyteus/agent/llm_response_processor/__init__.py +1 -8
  37. autobyteus/agent/message/context_file_type.py +1 -1
  38. autobyteus/agent/runtime/agent_runtime.py +29 -21
  39. autobyteus/agent/runtime/agent_worker.py +98 -19
  40. autobyteus/agent/shutdown_steps/__init__.py +2 -0
  41. autobyteus/agent/shutdown_steps/agent_shutdown_orchestrator.py +2 -0
  42. autobyteus/agent/shutdown_steps/tool_cleanup_step.py +58 -0
  43. autobyteus/agent/status/__init__.py +14 -0
  44. autobyteus/agent/status/manager.py +93 -0
  45. autobyteus/agent/status/status_deriver.py +96 -0
  46. autobyteus/agent/{phases/phase_enum.py → status/status_enum.py} +16 -16
  47. autobyteus/agent/status/status_update_utils.py +73 -0
  48. autobyteus/agent/streaming/__init__.py +52 -5
  49. autobyteus/agent/streaming/adapters/__init__.py +18 -0
  50. autobyteus/agent/streaming/adapters/invocation_adapter.py +184 -0
  51. autobyteus/agent/streaming/adapters/tool_call_parsing.py +163 -0
  52. autobyteus/agent/streaming/adapters/tool_syntax_registry.py +67 -0
  53. autobyteus/agent/streaming/agent_event_stream.py +3 -183
  54. autobyteus/agent/streaming/api_tool_call/__init__.py +16 -0
  55. autobyteus/agent/streaming/api_tool_call/file_content_streamer.py +56 -0
  56. autobyteus/agent/streaming/api_tool_call/json_string_field_extractor.py +175 -0
  57. autobyteus/agent/streaming/api_tool_call_streaming_response_handler.py +4 -0
  58. autobyteus/agent/streaming/events/__init__.py +6 -0
  59. autobyteus/agent/streaming/events/stream_event_payloads.py +284 -0
  60. autobyteus/agent/streaming/events/stream_events.py +141 -0
  61. autobyteus/agent/streaming/handlers/__init__.py +15 -0
  62. autobyteus/agent/streaming/handlers/api_tool_call_streaming_response_handler.py +303 -0
  63. autobyteus/agent/streaming/handlers/parsing_streaming_response_handler.py +107 -0
  64. autobyteus/agent/streaming/handlers/pass_through_streaming_response_handler.py +107 -0
  65. autobyteus/agent/streaming/handlers/streaming_handler_factory.py +177 -0
  66. autobyteus/agent/streaming/handlers/streaming_response_handler.py +58 -0
  67. autobyteus/agent/streaming/parser/__init__.py +61 -0
  68. autobyteus/agent/streaming/parser/event_emitter.py +181 -0
  69. autobyteus/agent/streaming/parser/events.py +4 -0
  70. autobyteus/agent/streaming/parser/invocation_adapter.py +4 -0
  71. autobyteus/agent/streaming/parser/json_parsing_strategies/__init__.py +19 -0
  72. autobyteus/agent/streaming/parser/json_parsing_strategies/base.py +32 -0
  73. autobyteus/agent/streaming/parser/json_parsing_strategies/default.py +34 -0
  74. autobyteus/agent/streaming/parser/json_parsing_strategies/gemini.py +31 -0
  75. autobyteus/agent/streaming/parser/json_parsing_strategies/openai.py +64 -0
  76. autobyteus/agent/streaming/parser/json_parsing_strategies/registry.py +75 -0
  77. autobyteus/agent/streaming/parser/parser_context.py +227 -0
  78. autobyteus/agent/streaming/parser/parser_factory.py +132 -0
  79. autobyteus/agent/streaming/parser/sentinel_format.py +7 -0
  80. autobyteus/agent/streaming/parser/state_factory.py +62 -0
  81. autobyteus/agent/streaming/parser/states/__init__.py +1 -0
  82. autobyteus/agent/streaming/parser/states/base_state.py +60 -0
  83. autobyteus/agent/streaming/parser/states/custom_xml_tag_run_bash_parsing_state.py +38 -0
  84. autobyteus/agent/streaming/parser/states/custom_xml_tag_write_file_parsing_state.py +55 -0
  85. autobyteus/agent/streaming/parser/states/delimited_content_state.py +146 -0
  86. autobyteus/agent/streaming/parser/states/json_initialization_state.py +144 -0
  87. autobyteus/agent/streaming/parser/states/json_tool_parsing_state.py +137 -0
  88. autobyteus/agent/streaming/parser/states/sentinel_content_state.py +30 -0
  89. autobyteus/agent/streaming/parser/states/sentinel_initialization_state.py +117 -0
  90. autobyteus/agent/streaming/parser/states/text_state.py +78 -0
  91. autobyteus/agent/streaming/parser/states/xml_patch_file_tool_parsing_state.py +328 -0
  92. autobyteus/agent/streaming/parser/states/xml_run_bash_tool_parsing_state.py +129 -0
  93. autobyteus/agent/streaming/parser/states/xml_tag_initialization_state.py +151 -0
  94. autobyteus/agent/streaming/parser/states/xml_tool_parsing_state.py +63 -0
  95. autobyteus/agent/streaming/parser/states/xml_write_file_tool_parsing_state.py +343 -0
  96. autobyteus/agent/streaming/parser/strategies/__init__.py +17 -0
  97. autobyteus/agent/streaming/parser/strategies/base.py +24 -0
  98. autobyteus/agent/streaming/parser/strategies/json_tool_strategy.py +26 -0
  99. autobyteus/agent/streaming/parser/strategies/registry.py +28 -0
  100. autobyteus/agent/streaming/parser/strategies/sentinel_strategy.py +23 -0
  101. autobyteus/agent/streaming/parser/strategies/xml_tag_strategy.py +21 -0
  102. autobyteus/agent/streaming/parser/stream_scanner.py +167 -0
  103. autobyteus/agent/streaming/parser/streaming_parser.py +212 -0
  104. autobyteus/agent/streaming/parser/tool_call_parsing.py +4 -0
  105. autobyteus/agent/streaming/parser/tool_constants.py +7 -0
  106. autobyteus/agent/streaming/parser/tool_syntax_registry.py +4 -0
  107. autobyteus/agent/streaming/parser/xml_tool_parsing_state_registry.py +55 -0
  108. autobyteus/agent/streaming/parsing_streaming_response_handler.py +4 -0
  109. autobyteus/agent/streaming/pass_through_streaming_response_handler.py +4 -0
  110. autobyteus/agent/streaming/queue_streamer.py +3 -57
  111. autobyteus/agent/streaming/segments/__init__.py +5 -0
  112. autobyteus/agent/streaming/segments/segment_events.py +81 -0
  113. autobyteus/agent/streaming/stream_event_payloads.py +2 -223
  114. autobyteus/agent/streaming/stream_events.py +3 -140
  115. autobyteus/agent/streaming/streaming_handler_factory.py +4 -0
  116. autobyteus/agent/streaming/streaming_response_handler.py +4 -0
  117. autobyteus/agent/streaming/streams/__init__.py +5 -0
  118. autobyteus/agent/streaming/streams/agent_event_stream.py +197 -0
  119. autobyteus/agent/streaming/utils/__init__.py +5 -0
  120. autobyteus/agent/streaming/utils/queue_streamer.py +59 -0
  121. autobyteus/agent/system_prompt_processor/__init__.py +2 -0
  122. autobyteus/agent/system_prompt_processor/available_skills_processor.py +96 -0
  123. autobyteus/agent/system_prompt_processor/base_processor.py +1 -1
  124. autobyteus/agent/system_prompt_processor/processor_meta.py +15 -2
  125. autobyteus/agent/system_prompt_processor/tool_manifest_injector_processor.py +39 -58
  126. autobyteus/agent/token_budget.py +56 -0
  127. autobyteus/agent/tool_execution_result_processor/memory_ingest_tool_result_processor.py +29 -0
  128. autobyteus/agent/tool_invocation.py +16 -40
  129. autobyteus/agent/tool_invocation_preprocessor/__init__.py +9 -0
  130. autobyteus/agent/tool_invocation_preprocessor/base_preprocessor.py +45 -0
  131. autobyteus/agent/tool_invocation_preprocessor/processor_definition.py +15 -0
  132. autobyteus/agent/tool_invocation_preprocessor/processor_meta.py +33 -0
  133. autobyteus/agent/tool_invocation_preprocessor/processor_registry.py +60 -0
  134. autobyteus/agent/utils/wait_for_idle.py +12 -14
  135. autobyteus/agent/workspace/base_workspace.py +6 -27
  136. autobyteus/agent_team/agent_team.py +3 -3
  137. autobyteus/agent_team/agent_team_builder.py +1 -41
  138. autobyteus/agent_team/bootstrap_steps/__init__.py +0 -4
  139. autobyteus/agent_team/bootstrap_steps/agent_configuration_preparation_step.py +8 -18
  140. autobyteus/agent_team/bootstrap_steps/agent_team_bootstrapper.py +4 -16
  141. autobyteus/agent_team/bootstrap_steps/base_agent_team_bootstrap_step.py +1 -2
  142. autobyteus/agent_team/bootstrap_steps/coordinator_initialization_step.py +1 -2
  143. autobyteus/agent_team/bootstrap_steps/task_notifier_initialization_step.py +1 -2
  144. autobyteus/agent_team/bootstrap_steps/team_context_initialization_step.py +4 -4
  145. autobyteus/agent_team/context/agent_team_config.py +6 -3
  146. autobyteus/agent_team/context/agent_team_context.py +25 -3
  147. autobyteus/agent_team/context/agent_team_runtime_state.py +9 -6
  148. autobyteus/agent_team/events/__init__.py +11 -0
  149. autobyteus/agent_team/events/agent_team_event_dispatcher.py +22 -9
  150. autobyteus/agent_team/events/agent_team_events.py +16 -0
  151. autobyteus/agent_team/events/event_store.py +57 -0
  152. autobyteus/agent_team/factory/agent_team_factory.py +8 -0
  153. autobyteus/agent_team/handlers/inter_agent_message_request_event_handler.py +18 -2
  154. autobyteus/agent_team/handlers/lifecycle_agent_team_event_handler.py +21 -5
  155. autobyteus/agent_team/handlers/process_user_message_event_handler.py +17 -8
  156. autobyteus/agent_team/handlers/tool_approval_team_event_handler.py +19 -4
  157. autobyteus/agent_team/runtime/agent_team_runtime.py +41 -10
  158. autobyteus/agent_team/runtime/agent_team_worker.py +69 -5
  159. autobyteus/agent_team/status/__init__.py +14 -0
  160. autobyteus/agent_team/status/agent_team_status.py +18 -0
  161. autobyteus/agent_team/status/agent_team_status_manager.py +33 -0
  162. autobyteus/agent_team/status/status_deriver.py +62 -0
  163. autobyteus/agent_team/status/status_update_utils.py +42 -0
  164. autobyteus/agent_team/streaming/__init__.py +2 -2
  165. autobyteus/agent_team/streaming/agent_team_event_notifier.py +6 -6
  166. autobyteus/agent_team/streaming/agent_team_stream_event_payloads.py +4 -4
  167. autobyteus/agent_team/streaming/agent_team_stream_events.py +3 -3
  168. autobyteus/agent_team/system_prompt_processor/__init__.py +6 -0
  169. autobyteus/agent_team/system_prompt_processor/team_manifest_injector_processor.py +76 -0
  170. autobyteus/agent_team/task_notification/task_notification_mode.py +19 -0
  171. autobyteus/agent_team/utils/wait_for_idle.py +4 -4
  172. autobyteus/cli/agent_cli.py +18 -10
  173. autobyteus/cli/agent_team_tui/app.py +14 -11
  174. autobyteus/cli/agent_team_tui/state.py +13 -15
  175. autobyteus/cli/agent_team_tui/widgets/agent_list_sidebar.py +15 -15
  176. autobyteus/cli/agent_team_tui/widgets/focus_pane.py +143 -36
  177. autobyteus/cli/agent_team_tui/widgets/renderables.py +1 -1
  178. autobyteus/cli/agent_team_tui/widgets/shared.py +25 -25
  179. autobyteus/cli/cli_display.py +193 -44
  180. autobyteus/cli/workflow_tui/app.py +9 -10
  181. autobyteus/cli/workflow_tui/state.py +14 -16
  182. autobyteus/cli/workflow_tui/widgets/agent_list_sidebar.py +15 -15
  183. autobyteus/cli/workflow_tui/widgets/focus_pane.py +137 -35
  184. autobyteus/cli/workflow_tui/widgets/renderables.py +1 -1
  185. autobyteus/cli/workflow_tui/widgets/shared.py +25 -25
  186. autobyteus/clients/autobyteus_client.py +94 -1
  187. autobyteus/events/event_types.py +11 -18
  188. autobyteus/llm/api/autobyteus_llm.py +33 -29
  189. autobyteus/llm/api/claude_llm.py +142 -36
  190. autobyteus/llm/api/gemini_llm.py +163 -59
  191. autobyteus/llm/api/grok_llm.py +1 -1
  192. autobyteus/llm/api/minimax_llm.py +26 -0
  193. autobyteus/llm/api/mistral_llm.py +113 -87
  194. autobyteus/llm/api/ollama_llm.py +9 -42
  195. autobyteus/llm/api/openai_compatible_llm.py +127 -91
  196. autobyteus/llm/api/openai_llm.py +3 -3
  197. autobyteus/llm/api/openai_responses_llm.py +324 -0
  198. autobyteus/llm/api/zhipu_llm.py +21 -2
  199. autobyteus/llm/autobyteus_provider.py +70 -60
  200. autobyteus/llm/base_llm.py +85 -81
  201. autobyteus/llm/converters/__init__.py +14 -0
  202. autobyteus/llm/converters/anthropic_tool_call_converter.py +37 -0
  203. autobyteus/llm/converters/gemini_tool_call_converter.py +57 -0
  204. autobyteus/llm/converters/mistral_tool_call_converter.py +37 -0
  205. autobyteus/llm/converters/openai_tool_call_converter.py +38 -0
  206. autobyteus/llm/extensions/base_extension.py +6 -12
  207. autobyteus/llm/extensions/token_usage_tracking_extension.py +45 -18
  208. autobyteus/llm/llm_factory.py +282 -204
  209. autobyteus/llm/lmstudio_provider.py +60 -49
  210. autobyteus/llm/models.py +35 -2
  211. autobyteus/llm/ollama_provider.py +60 -49
  212. autobyteus/llm/ollama_provider_resolver.py +0 -1
  213. autobyteus/llm/prompt_renderers/__init__.py +19 -0
  214. autobyteus/llm/prompt_renderers/anthropic_prompt_renderer.py +104 -0
  215. autobyteus/llm/prompt_renderers/autobyteus_prompt_renderer.py +19 -0
  216. autobyteus/llm/prompt_renderers/base_prompt_renderer.py +10 -0
  217. autobyteus/llm/prompt_renderers/gemini_prompt_renderer.py +63 -0
  218. autobyteus/llm/prompt_renderers/mistral_prompt_renderer.py +87 -0
  219. autobyteus/llm/prompt_renderers/ollama_prompt_renderer.py +51 -0
  220. autobyteus/llm/prompt_renderers/openai_chat_renderer.py +97 -0
  221. autobyteus/llm/prompt_renderers/openai_responses_renderer.py +101 -0
  222. autobyteus/llm/providers.py +1 -3
  223. autobyteus/llm/token_counter/claude_token_counter.py +56 -25
  224. autobyteus/llm/token_counter/mistral_token_counter.py +12 -8
  225. autobyteus/llm/token_counter/openai_token_counter.py +24 -5
  226. autobyteus/llm/token_counter/token_counter_factory.py +12 -5
  227. autobyteus/llm/utils/llm_config.py +6 -12
  228. autobyteus/llm/utils/media_payload_formatter.py +27 -20
  229. autobyteus/llm/utils/messages.py +55 -3
  230. autobyteus/llm/utils/response_types.py +3 -0
  231. autobyteus/llm/utils/tool_call_delta.py +31 -0
  232. autobyteus/memory/__init__.py +32 -0
  233. autobyteus/memory/active_transcript.py +69 -0
  234. autobyteus/memory/compaction/__init__.py +9 -0
  235. autobyteus/memory/compaction/compaction_result.py +8 -0
  236. autobyteus/memory/compaction/compactor.py +89 -0
  237. autobyteus/memory/compaction/summarizer.py +11 -0
  238. autobyteus/memory/compaction_snapshot_builder.py +84 -0
  239. autobyteus/memory/memory_manager.py +183 -0
  240. autobyteus/memory/models/__init__.py +14 -0
  241. autobyteus/memory/models/episodic_item.py +41 -0
  242. autobyteus/memory/models/memory_types.py +7 -0
  243. autobyteus/memory/models/raw_trace_item.py +79 -0
  244. autobyteus/memory/models/semantic_item.py +41 -0
  245. autobyteus/memory/models/tool_interaction.py +20 -0
  246. autobyteus/memory/policies/__init__.py +5 -0
  247. autobyteus/memory/policies/compaction_policy.py +16 -0
  248. autobyteus/memory/retrieval/__init__.py +7 -0
  249. autobyteus/memory/retrieval/memory_bundle.py +11 -0
  250. autobyteus/memory/retrieval/retriever.py +13 -0
  251. autobyteus/memory/store/__init__.py +7 -0
  252. autobyteus/memory/store/base_store.py +14 -0
  253. autobyteus/memory/store/file_store.py +98 -0
  254. autobyteus/memory/tool_interaction_builder.py +46 -0
  255. autobyteus/memory/turn_tracker.py +9 -0
  256. autobyteus/multimedia/audio/api/autobyteus_audio_client.py +19 -5
  257. autobyteus/multimedia/audio/api/gemini_audio_client.py +108 -16
  258. autobyteus/multimedia/audio/audio_client_factory.py +47 -9
  259. autobyteus/multimedia/audio/audio_model.py +2 -1
  260. autobyteus/multimedia/image/api/autobyteus_image_client.py +19 -5
  261. autobyteus/multimedia/image/api/gemini_image_client.py +38 -17
  262. autobyteus/multimedia/image/api/openai_image_client.py +125 -43
  263. autobyteus/multimedia/image/autobyteus_image_provider.py +2 -1
  264. autobyteus/multimedia/image/image_client_factory.py +47 -15
  265. autobyteus/multimedia/image/image_model.py +5 -2
  266. autobyteus/multimedia/providers.py +3 -2
  267. autobyteus/skills/loader.py +71 -0
  268. autobyteus/skills/model.py +11 -0
  269. autobyteus/skills/registry.py +70 -0
  270. autobyteus/task_management/tools/todo_tools/add_todo.py +2 -2
  271. autobyteus/task_management/tools/todo_tools/create_todo_list.py +2 -2
  272. autobyteus/task_management/tools/todo_tools/update_todo_status.py +2 -2
  273. autobyteus/tools/__init__.py +34 -47
  274. autobyteus/tools/base_tool.py +7 -0
  275. autobyteus/tools/file/__init__.py +2 -6
  276. autobyteus/tools/file/patch_file.py +149 -0
  277. autobyteus/tools/file/read_file.py +36 -5
  278. autobyteus/tools/file/write_file.py +4 -1
  279. autobyteus/tools/functional_tool.py +43 -6
  280. autobyteus/tools/mcp/__init__.py +2 -0
  281. autobyteus/tools/mcp/config_service.py +5 -1
  282. autobyteus/tools/mcp/server/__init__.py +2 -0
  283. autobyteus/tools/mcp/server/http_managed_mcp_server.py +1 -1
  284. autobyteus/tools/mcp/server/websocket_managed_mcp_server.py +141 -0
  285. autobyteus/tools/mcp/server_instance_manager.py +8 -1
  286. autobyteus/tools/mcp/types.py +61 -0
  287. autobyteus/tools/multimedia/audio_tools.py +70 -17
  288. autobyteus/tools/multimedia/download_media_tool.py +18 -4
  289. autobyteus/tools/multimedia/image_tools.py +246 -62
  290. autobyteus/tools/operation_executor/journal_manager.py +107 -0
  291. autobyteus/tools/operation_executor/operation_event_buffer.py +57 -0
  292. autobyteus/tools/operation_executor/operation_event_producer.py +29 -0
  293. autobyteus/tools/operation_executor/operation_executor.py +58 -0
  294. autobyteus/tools/registry/tool_definition.py +43 -2
  295. autobyteus/tools/skill/load_skill.py +50 -0
  296. autobyteus/tools/terminal/__init__.py +45 -0
  297. autobyteus/tools/terminal/ansi_utils.py +32 -0
  298. autobyteus/tools/terminal/background_process_manager.py +233 -0
  299. autobyteus/tools/terminal/output_buffer.py +105 -0
  300. autobyteus/tools/terminal/prompt_detector.py +63 -0
  301. autobyteus/tools/terminal/pty_session.py +241 -0
  302. autobyteus/tools/terminal/session_factory.py +20 -0
  303. autobyteus/tools/terminal/terminal_session_manager.py +226 -0
  304. autobyteus/tools/terminal/tools/__init__.py +13 -0
  305. autobyteus/tools/terminal/tools/get_process_output.py +81 -0
  306. autobyteus/tools/terminal/tools/run_bash.py +109 -0
  307. autobyteus/tools/terminal/tools/start_background_process.py +104 -0
  308. autobyteus/tools/terminal/tools/stop_background_process.py +67 -0
  309. autobyteus/tools/terminal/types.py +54 -0
  310. autobyteus/tools/terminal/wsl_tmux_session.py +221 -0
  311. autobyteus/tools/terminal/wsl_utils.py +156 -0
  312. autobyteus/tools/transaction_management/backup_handler.py +48 -0
  313. autobyteus/tools/transaction_management/operation_lifecycle_manager.py +62 -0
  314. autobyteus/tools/usage/__init__.py +1 -2
  315. autobyteus/tools/usage/formatters/__init__.py +17 -1
  316. autobyteus/tools/usage/formatters/base_formatter.py +8 -0
  317. autobyteus/tools/usage/formatters/default_xml_schema_formatter.py +2 -2
  318. autobyteus/tools/usage/formatters/mistral_json_schema_formatter.py +18 -0
  319. autobyteus/tools/usage/formatters/patch_file_xml_example_formatter.py +64 -0
  320. autobyteus/tools/usage/formatters/patch_file_xml_schema_formatter.py +31 -0
  321. autobyteus/tools/usage/formatters/run_bash_xml_example_formatter.py +32 -0
  322. autobyteus/tools/usage/formatters/run_bash_xml_schema_formatter.py +36 -0
  323. autobyteus/tools/usage/formatters/write_file_xml_example_formatter.py +53 -0
  324. autobyteus/tools/usage/formatters/write_file_xml_schema_formatter.py +31 -0
  325. autobyteus/tools/usage/providers/tool_manifest_provider.py +10 -10
  326. autobyteus/tools/usage/registries/__init__.py +1 -3
  327. autobyteus/tools/usage/registries/tool_formatting_registry.py +115 -8
  328. autobyteus/tools/usage/tool_schema_provider.py +51 -0
  329. autobyteus/tools/web/__init__.py +4 -0
  330. autobyteus/tools/web/read_url_tool.py +80 -0
  331. autobyteus/utils/diff_utils.py +271 -0
  332. autobyteus/utils/download_utils.py +109 -0
  333. autobyteus/utils/file_utils.py +57 -2
  334. autobyteus/utils/gemini_helper.py +56 -0
  335. autobyteus/utils/gemini_model_mapping.py +71 -0
  336. autobyteus/utils/llm_output_formatter.py +75 -0
  337. autobyteus/utils/tool_call_format.py +36 -0
  338. autobyteus/workflow/agentic_workflow.py +3 -3
  339. autobyteus/workflow/bootstrap_steps/agent_tool_injection_step.py +2 -2
  340. autobyteus/workflow/bootstrap_steps/base_workflow_bootstrap_step.py +2 -2
  341. autobyteus/workflow/bootstrap_steps/coordinator_initialization_step.py +2 -2
  342. autobyteus/workflow/bootstrap_steps/coordinator_prompt_preparation_step.py +3 -9
  343. autobyteus/workflow/bootstrap_steps/workflow_bootstrapper.py +6 -6
  344. autobyteus/workflow/bootstrap_steps/workflow_runtime_queue_initialization_step.py +2 -2
  345. autobyteus/workflow/context/workflow_context.py +3 -3
  346. autobyteus/workflow/context/workflow_runtime_state.py +5 -5
  347. autobyteus/workflow/events/workflow_event_dispatcher.py +5 -5
  348. autobyteus/workflow/handlers/lifecycle_workflow_event_handler.py +3 -3
  349. autobyteus/workflow/handlers/process_user_message_event_handler.py +5 -5
  350. autobyteus/workflow/handlers/tool_approval_workflow_event_handler.py +2 -2
  351. autobyteus/workflow/runtime/workflow_runtime.py +8 -8
  352. autobyteus/workflow/runtime/workflow_worker.py +3 -3
  353. autobyteus/workflow/status/__init__.py +11 -0
  354. autobyteus/workflow/status/workflow_status.py +19 -0
  355. autobyteus/workflow/status/workflow_status_manager.py +48 -0
  356. autobyteus/workflow/streaming/__init__.py +2 -2
  357. autobyteus/workflow/streaming/workflow_event_notifier.py +7 -7
  358. autobyteus/workflow/streaming/workflow_stream_event_payloads.py +4 -4
  359. autobyteus/workflow/streaming/workflow_stream_events.py +3 -3
  360. autobyteus/workflow/utils/wait_for_idle.py +4 -4
  361. autobyteus-1.2.3.dist-info/METADATA +293 -0
  362. autobyteus-1.2.3.dist-info/RECORD +600 -0
  363. {autobyteus-1.2.1.dist-info → autobyteus-1.2.3.dist-info}/WHEEL +1 -1
  364. {autobyteus-1.2.1.dist-info → autobyteus-1.2.3.dist-info}/top_level.txt +0 -1
  365. autobyteus/agent/bootstrap_steps/agent_runtime_queue_initialization_step.py +0 -57
  366. autobyteus/agent/hooks/__init__.py +0 -16
  367. autobyteus/agent/hooks/base_phase_hook.py +0 -78
  368. autobyteus/agent/hooks/hook_definition.py +0 -36
  369. autobyteus/agent/hooks/hook_meta.py +0 -37
  370. autobyteus/agent/hooks/hook_registry.py +0 -106
  371. autobyteus/agent/llm_response_processor/provider_aware_tool_usage_processor.py +0 -103
  372. autobyteus/agent/phases/__init__.py +0 -18
  373. autobyteus/agent/phases/discover.py +0 -53
  374. autobyteus/agent/phases/manager.py +0 -265
  375. autobyteus/agent/phases/transition_decorator.py +0 -40
  376. autobyteus/agent/phases/transition_info.py +0 -33
  377. autobyteus/agent/remote_agent.py +0 -244
  378. autobyteus/agent/workspace/workspace_definition.py +0 -36
  379. autobyteus/agent/workspace/workspace_meta.py +0 -37
  380. autobyteus/agent/workspace/workspace_registry.py +0 -72
  381. autobyteus/agent_team/bootstrap_steps/agent_team_runtime_queue_initialization_step.py +0 -25
  382. autobyteus/agent_team/bootstrap_steps/coordinator_prompt_preparation_step.py +0 -85
  383. autobyteus/agent_team/phases/__init__.py +0 -11
  384. autobyteus/agent_team/phases/agent_team_operational_phase.py +0 -19
  385. autobyteus/agent_team/phases/agent_team_phase_manager.py +0 -48
  386. autobyteus/llm/api/bedrock_llm.py +0 -92
  387. autobyteus/llm/api/groq_llm.py +0 -94
  388. autobyteus/llm/api/nvidia_llm.py +0 -108
  389. autobyteus/llm/utils/token_pricing_config.py +0 -87
  390. autobyteus/rpc/__init__.py +0 -73
  391. autobyteus/rpc/client/__init__.py +0 -17
  392. autobyteus/rpc/client/abstract_client_connection.py +0 -124
  393. autobyteus/rpc/client/client_connection_manager.py +0 -153
  394. autobyteus/rpc/client/sse_client_connection.py +0 -306
  395. autobyteus/rpc/client/stdio_client_connection.py +0 -280
  396. autobyteus/rpc/config/__init__.py +0 -13
  397. autobyteus/rpc/config/agent_server_config.py +0 -153
  398. autobyteus/rpc/config/agent_server_registry.py +0 -152
  399. autobyteus/rpc/hosting.py +0 -244
  400. autobyteus/rpc/protocol.py +0 -244
  401. autobyteus/rpc/server/__init__.py +0 -20
  402. autobyteus/rpc/server/agent_server_endpoint.py +0 -181
  403. autobyteus/rpc/server/base_method_handler.py +0 -40
  404. autobyteus/rpc/server/method_handlers.py +0 -259
  405. autobyteus/rpc/server/sse_server_handler.py +0 -182
  406. autobyteus/rpc/server/stdio_server_handler.py +0 -151
  407. autobyteus/rpc/server_main.py +0 -198
  408. autobyteus/rpc/transport_type.py +0 -13
  409. autobyteus/tools/bash/__init__.py +0 -2
  410. autobyteus/tools/bash/bash_executor.py +0 -100
  411. autobyteus/tools/browser/__init__.py +0 -2
  412. autobyteus/tools/browser/session_aware/browser_session_aware_navigate_to.py +0 -75
  413. autobyteus/tools/browser/session_aware/browser_session_aware_tool.py +0 -30
  414. autobyteus/tools/browser/session_aware/browser_session_aware_web_element_trigger.py +0 -154
  415. autobyteus/tools/browser/session_aware/browser_session_aware_webpage_reader.py +0 -89
  416. autobyteus/tools/browser/session_aware/browser_session_aware_webpage_screenshot_taker.py +0 -107
  417. autobyteus/tools/browser/session_aware/factory/browser_session_aware_web_element_trigger_factory.py +0 -14
  418. autobyteus/tools/browser/session_aware/factory/browser_session_aware_webpage_reader_factory.py +0 -26
  419. autobyteus/tools/browser/session_aware/factory/browser_session_aware_webpage_screenshot_taker_factory.py +0 -14
  420. autobyteus/tools/browser/session_aware/shared_browser_session.py +0 -11
  421. autobyteus/tools/browser/session_aware/shared_browser_session_manager.py +0 -25
  422. autobyteus/tools/browser/session_aware/web_element_action.py +0 -20
  423. autobyteus/tools/browser/standalone/__init__.py +0 -6
  424. autobyteus/tools/browser/standalone/factory/__init__.py +0 -0
  425. autobyteus/tools/browser/standalone/factory/webpage_reader_factory.py +0 -25
  426. autobyteus/tools/browser/standalone/factory/webpage_screenshot_taker_factory.py +0 -14
  427. autobyteus/tools/browser/standalone/navigate_to.py +0 -84
  428. autobyteus/tools/browser/standalone/web_page_pdf_generator.py +0 -101
  429. autobyteus/tools/browser/standalone/webpage_image_downloader.py +0 -169
  430. autobyteus/tools/browser/standalone/webpage_reader.py +0 -105
  431. autobyteus/tools/browser/standalone/webpage_screenshot_taker.py +0 -105
  432. autobyteus/tools/file/edit_file.py +0 -200
  433. autobyteus/tools/file/list_directory.py +0 -168
  434. autobyteus/tools/file/search_files.py +0 -188
  435. autobyteus/tools/timer.py +0 -175
  436. autobyteus/tools/usage/parsers/__init__.py +0 -22
  437. autobyteus/tools/usage/parsers/_json_extractor.py +0 -99
  438. autobyteus/tools/usage/parsers/_string_decoders.py +0 -18
  439. autobyteus/tools/usage/parsers/anthropic_xml_tool_usage_parser.py +0 -10
  440. autobyteus/tools/usage/parsers/base_parser.py +0 -41
  441. autobyteus/tools/usage/parsers/default_json_tool_usage_parser.py +0 -83
  442. autobyteus/tools/usage/parsers/default_xml_tool_usage_parser.py +0 -316
  443. autobyteus/tools/usage/parsers/exceptions.py +0 -13
  444. autobyteus/tools/usage/parsers/gemini_json_tool_usage_parser.py +0 -77
  445. autobyteus/tools/usage/parsers/openai_json_tool_usage_parser.py +0 -149
  446. autobyteus/tools/usage/parsers/provider_aware_tool_usage_parser.py +0 -59
  447. autobyteus/tools/usage/registries/tool_usage_parser_registry.py +0 -62
  448. autobyteus/workflow/phases/__init__.py +0 -11
  449. autobyteus/workflow/phases/workflow_operational_phase.py +0 -19
  450. autobyteus/workflow/phases/workflow_phase_manager.py +0 -48
  451. autobyteus-1.2.1.dist-info/METADATA +0 -205
  452. autobyteus-1.2.1.dist-info/RECORD +0 -511
  453. examples/__init__.py +0 -1
  454. examples/agent_team/__init__.py +0 -1
  455. examples/discover_phase_transitions.py +0 -104
  456. examples/run_agentic_software_engineer.py +0 -239
  457. examples/run_browser_agent.py +0 -262
  458. examples/run_google_slides_agent.py +0 -287
  459. examples/run_mcp_browser_client.py +0 -174
  460. examples/run_mcp_google_slides_client.py +0 -270
  461. examples/run_mcp_list_tools.py +0 -189
  462. examples/run_poem_writer.py +0 -284
  463. examples/run_sqlite_agent.py +0 -295
  464. /autobyteus/{tools/browser/session_aware → skills}/__init__.py +0 -0
  465. /autobyteus/tools/{browser/session_aware/factory → skill}/__init__.py +0 -0
  466. {autobyteus-1.2.1.dist-info → autobyteus-1.2.3.dist-info}/licenses/LICENSE +0 -0
autobyteus/llm/api/autobyteus_llm.py
@@ -4,8 +4,9 @@ from autobyteus.llm.models import LLMModel
  from autobyteus.llm.utils.llm_config import LLMConfig
  from autobyteus.llm.utils.token_usage import TokenUsage
  from autobyteus.llm.utils.response_types import CompleteResponse, ChunkResponse
- from autobyteus.llm.user_message import LLMUserMessage
+ from autobyteus.llm.utils.messages import Message
  from autobyteus.clients import AutobyteusClient
+ from autobyteus.llm.prompt_renderers.autobyteus_prompt_renderer import AutobyteusPromptRenderer
  import logging
  import uuid

@@ -20,26 +21,34 @@ class AutobyteusLLM(BaseLLM):

  self.client = AutobyteusClient(server_url=self.model.host_url)
  self.conversation_id = str(uuid.uuid4())
+ self._renderer = AutobyteusPromptRenderer()
  logger.info(f"AutobyteusLLM initialized for model '{self.model.model_identifier}' with conversation ID: {self.conversation_id}")

- async def _send_user_message_to_llm(
+ async def _send_messages_to_llm(
  self,
- user_message: LLMUserMessage,
+ messages: List[Message],
  **kwargs
  ) -> CompleteResponse:
- self.add_user_message(user_message)
+ rendered = await self._renderer.render(messages)
+ if not rendered:
+ raise ValueError("AutobyteusLLM requires at least one user message.")
+ payload = rendered[0]
  try:
  response = await self.client.send_message(
  conversation_id=self.conversation_id,
  model_name=self.model.name,
- user_message=user_message.content,
- image_urls=user_message.image_urls,
- audio_urls=user_message.audio_urls,
- video_urls=user_message.video_urls
+ user_message=payload.get("content", ""),
+ image_urls=payload.get("image_urls", []),
+ audio_urls=payload.get("audio_urls", []),
+ video_urls=payload.get("video_urls", []),
  )

- assistant_message = response['response']
- self.add_assistant_message(assistant_message)
+ assistant_message = (
+ response.get("response")
+ or response.get("content")
+ or response.get("message")
+ or ""
+ )

  token_usage_data = response.get('token_usage') or {}
  token_usage = TokenUsage(
@@ -54,25 +63,27 @@ class AutobyteusLLM(BaseLLM):
  )
  except Exception as e:
  logger.error(f"Error processing message: {str(e)}")
- await self._handle_error_cleanup()
  raise

- async def _stream_user_message_to_llm(
+ async def _stream_messages_to_llm(
  self,
- user_message: LLMUserMessage,
+ messages: List[Message],
  **kwargs
  ) -> AsyncGenerator[ChunkResponse, None]:
- self.add_user_message(user_message)
+ rendered = await self._renderer.render(messages)
+ if not rendered:
+ raise ValueError("AutobyteusLLM requires at least one user message.")
+ payload = rendered[0]
  complete_response = ""

  try:
  async for chunk in self.client.stream_message(
  conversation_id=self.conversation_id,
  model_name=self.model.name,
- user_message=user_message.content,
- image_urls=user_message.image_urls,
- audio_urls=user_message.audio_urls,
- video_urls=user_message.video_urls
+ user_message=payload.get("content", ""),
+ image_urls=payload.get("image_urls", []),
+ audio_urls=payload.get("audio_urls", []),
+ video_urls=payload.get("video_urls", []),
  ):
  if 'error' in chunk:
  raise RuntimeError(chunk['error'])
@@ -100,24 +111,17 @@ class AutobyteusLLM(BaseLLM):
  video_urls=chunk.get('video_urls', []),
  usage=token_usage
  )
-
- self.add_assistant_message(complete_response)
  except Exception as e:
  logger.error(f"Error streaming message: {str(e)}")
- await self._handle_error_cleanup()
  raise

  async def cleanup(self):
+ """
+ Clean up the remote conversation. The owning agent controls the HTTP
+ client lifecycle.
+ """
  try:
  await self.client.cleanup(self.conversation_id)
  await super().cleanup()
  except Exception as e:
  logger.error(f"Error during cleanup: {str(e)}")
- finally:
- await self.client.close()
-
- async def _handle_error_cleanup(self):
- try:
- await self.cleanup()
- except Exception as cleanup_error:
- logger.error(f"Error during error cleanup: {str(cleanup_error)}")
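Note: the net effect of this file's changes is that AutobyteusLLM no longer takes a single LLMUserMessage and mutates shared history itself; it receives the full message list and delegates payload construction to AutobyteusPromptRenderer, whose render() returns a list of payload dicts. A minimal sketch of that renderer flow follows; the Message(role=..., content=...) constructor form is an assumption not shown in this diff, and only the renderer call pattern is taken from the hunks above.

# Illustrative sketch only; Message/MessageRole keyword construction is assumed.
from autobyteus.llm.utils.messages import Message, MessageRole
from autobyteus.llm.prompt_renderers.autobyteus_prompt_renderer import AutobyteusPromptRenderer

async def build_payload():
    messages = [
        Message(role=MessageRole.SYSTEM, content="You are a helpful assistant."),
        Message(role=MessageRole.USER, content="Summarize the 1.2.3 changes."),
    ]
    renderer = AutobyteusPromptRenderer()
    rendered = await renderer.render(messages)   # list of payload dicts, per the diff
    payload = rendered[0]
    # The LLM forwards these fields to AutobyteusClient.send_message / stream_message.
    return payload.get("content", ""), payload.get("image_urls", [])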
autobyteus/llm/api/claude_llm.py
@@ -1,27 +1,84 @@
- from typing import Dict, Optional, List, AsyncGenerator, Tuple
  import anthropic
  import os
  import logging
+ from typing import Dict, Optional, List, AsyncGenerator, Tuple
+
  from autobyteus.llm.models import LLMModel
  from autobyteus.llm.base_llm import BaseLLM
  from autobyteus.llm.utils.llm_config import LLMConfig
  from autobyteus.llm.utils.messages import MessageRole, Message
  from autobyteus.llm.utils.token_usage import TokenUsage
  from autobyteus.llm.utils.response_types import CompleteResponse, ChunkResponse
- from autobyteus.llm.user_message import LLMUserMessage
+ from autobyteus.llm.converters import convert_anthropic_tool_call
+ from autobyteus.llm.prompt_renderers.anthropic_prompt_renderer import AnthropicPromptRenderer

  logger = logging.getLogger(__name__)

+ def _build_thinking_param(extra_params: Dict) -> Optional[Dict]:
+ enabled = extra_params.get("thinking_enabled", False)
+ if not isinstance(enabled, bool) or not enabled:
+ return None
+
+ budget = extra_params.get("thinking_budget_tokens", 1024)
+ try:
+ budget_int = int(budget)
+ except (TypeError, ValueError):
+ budget_int = 1024
+
+ return {"type": "enabled", "budget_tokens": budget_int}
+
+
+ def _split_claude_content_blocks(blocks: List) -> Tuple[str, str]:
+ """Split Claude content blocks into visible text and thinking summaries."""
+ content_segments: List[str] = []
+ thinking_segments: List[str] = []
+
+ for block in blocks or []:
+ block_type = getattr(block, "type", None)
+ if block_type is None and isinstance(block, dict):
+ block_type = block.get("type")
+
+ if block_type == "text":
+ text = getattr(block, "text", None)
+ if text is None and isinstance(block, dict):
+ text = block.get("text")
+ if text:
+ content_segments.append(text)
+ elif block_type == "thinking":
+ thinking = getattr(block, "thinking", None)
+ if thinking is None and isinstance(block, dict):
+ thinking = block.get("thinking")
+ if thinking:
+ thinking_segments.append(thinking)
+ elif block_type == "redacted_thinking":
+ redacted = getattr(block, "redacted_thinking", None)
+ if redacted is None and isinstance(block, dict):
+ redacted = block.get("redacted_thinking")
+ if redacted:
+ thinking_segments.append(redacted)
+
+ return "".join(content_segments), "".join(thinking_segments)
+
+
+ def _split_system_message(messages: List[Message]) -> Tuple[Optional[str], List[Message]]:
+ system_parts = [msg.content for msg in messages if msg.role == MessageRole.SYSTEM and msg.content]
+ system_prompt = "\n".join(system_parts) if system_parts else None
+ remaining = [msg for msg in messages if msg.role != MessageRole.SYSTEM]
+ return system_prompt, remaining
+
+
  class ClaudeLLM(BaseLLM):
  def __init__(self, model: LLMModel = None, llm_config: LLMConfig = None):
  if model is None:
- model = LLMModel['claude-4-sonnet']
+ model = LLMModel['claude-4.5-sonnet']
  if llm_config is None:
  llm_config = LLMConfig()

  super().__init__(model=model, llm_config=llm_config)
  self.client = self.initialize()
- self.max_tokens = 8000
+ self._renderer = AnthropicPromptRenderer()
+ # Claude Sonnet 4.5 currently allows up to ~8k output tokens; let config override.
+ self.max_tokens = llm_config.max_tokens if llm_config.max_tokens is not None else 8192

  @classmethod
  def initialize(cls):
@@ -36,10 +93,6 @@ class ClaudeLLM(BaseLLM):
  except Exception as e:
  raise ValueError(f"Failed to initialize Anthropic client: {str(e)}")

- def _get_non_system_messages(self) -> List[Dict]:
- # NOTE: This will need to be updated to handle multimodal messages for Claude
- return [msg.to_dict() for msg in self.messages if msg.role != MessageRole.SYSTEM]
-
  def _create_token_usage(self, input_tokens: int, output_tokens: int) -> TokenUsage:
  return TokenUsage(
  prompt_tokens=input_tokens,
@@ -47,23 +100,37 @@ class ClaudeLLM(BaseLLM):
  total_tokens=input_tokens + output_tokens
  )

- async def _send_user_message_to_llm(self, user_message: LLMUserMessage, **kwargs) -> CompleteResponse:
- self.add_user_message(user_message)
+ async def _send_messages_to_llm(self, messages: List[Message], **kwargs) -> CompleteResponse:
+ try:
+ system_prompt, non_system = _split_system_message(messages)
+ formatted_messages = await self._renderer.render(non_system)
+ thinking_param = _build_thinking_param(self.config.extra_params)

- # NOTE: This implementation does not yet support multimodal inputs for Claude.
- # It will only send the text content.
+ request_kwargs = {
+ "model": self.model.value,
+ "max_tokens": self.max_tokens,
+ "messages": formatted_messages,
+ }
+ if system_prompt:
+ request_kwargs["system"] = system_prompt
+ if thinking_param:
+ # Extended thinking is not compatible with temperature modifications
+ request_kwargs["thinking"] = thinking_param
+ else:
+ request_kwargs["temperature"] = 0

- try:
  response = self.client.messages.create(
- model=self.model.value,
- max_tokens=self.max_tokens,
- temperature=0,
- system=self.system_message,
- messages=self._get_non_system_messages()
+ **request_kwargs
  )

- assistant_message = response.content[0].text
- self.add_assistant_message(assistant_message)
+ assistant_message = getattr(response, "text", "") or ""
+ reasoning_summary = None
+ if response.content:
+ parsed_text, parsed_thinking = _split_claude_content_blocks(response.content)
+ if parsed_text:
+ assistant_message = parsed_text
+ if parsed_thinking:
+ reasoning_summary = parsed_thinking

  token_usage = self._create_token_usage(
  response.usage.input_tokens,
@@ -74,35 +141,72 @@ class ClaudeLLM(BaseLLM):

  return CompleteResponse(
  content=assistant_message,
+ reasoning=reasoning_summary,
  usage=token_usage
  )
  except anthropic.APIError as e:
  logger.error(f"Error in Claude API call: {str(e)}")
  raise ValueError(f"Error in Claude API call: {str(e)}")

- async def _stream_user_message_to_llm(
- self, user_message: LLMUserMessage, **kwargs
+ async def _stream_messages_to_llm(
+ self, messages: List[Message], **kwargs
  ) -> AsyncGenerator[ChunkResponse, None]:
- self.add_user_message(user_message)
  complete_response = ""
+ complete_reasoning = ""
  final_message = None

- # NOTE: This implementation does not yet support multimodal inputs for Claude.
- # It will only send the text content.
+ # Extract tools if provided
+ tools = kwargs.get("tools")

  try:
- with self.client.messages.stream(
- model=self.model.value,
- max_tokens=self.max_tokens,
- temperature=0,
- system=self.system_message,
- messages=self._get_non_system_messages(),
- ) as stream:
+ # Prepare arguments for stream
+ system_prompt, non_system = _split_system_message(messages)
+ formatted_messages = await self._renderer.render(non_system)
+ thinking_param = _build_thinking_param(self.config.extra_params)
+ stream_kwargs = {
+ "model": self.model.value,
+ "max_tokens": self.max_tokens,
+ "messages": formatted_messages,
+ }
+ if system_prompt:
+ stream_kwargs["system"] = system_prompt
+ if thinking_param:
+ # Extended thinking is not compatible with temperature modifications
+ stream_kwargs["thinking"] = thinking_param
+ else:
+ stream_kwargs["temperature"] = 0
+
+ if tools:
+ stream_kwargs["tools"] = tools
+
+ with self.client.messages.stream(**stream_kwargs) as stream:
  for event in stream:
- if event.type == "content_block_delta" and event.delta.type == "text_delta":
- complete_response += event.delta.text
+
+ # Handle text content
+ if event.type == "content_block_delta":
+ delta_type = getattr(event.delta, "type", None)
+ if delta_type == "text_delta":
+ complete_response += event.delta.text
+ yield ChunkResponse(
+ content=event.delta.text,
+ is_complete=False
+ )
+ elif delta_type == "thinking_delta":
+ thinking_delta = getattr(event.delta, "thinking", None)
+ if thinking_delta:
+ complete_reasoning += thinking_delta
+ yield ChunkResponse(
+ content="",
+ reasoning=thinking_delta,
+ is_complete=False
+ )
+
+ # Handle tool calls using common converter
+ tool_calls = convert_anthropic_tool_call(event)
+ if tool_calls:
  yield ChunkResponse(
- content=event.delta.text,
+ content="",
+ tool_calls=tool_calls,
  is_complete=False
  )

@@ -120,7 +224,9 @@ class ClaudeLLM(BaseLLM):
  usage=token_usage
  )

- self.add_assistant_message(complete_response)
+ # Only add assistant message if there's actual content.
+ # Tool-call-only responses should not add empty messages, as Claude API
+ # rejects subsequent requests with "all messages must have non-empty content".
  except anthropic.APIError as e:
  logger.error(f"Error in Claude API streaming: {str(e)}")
  raise ValueError(f"Error in Claude API streaming: {str(e)}")
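Note: taken together, the ClaudeLLM changes route prompt construction through AnthropicPromptRenderer and make extended thinking opt-in through LLMConfig extra_params, using the thinking_enabled and thinking_budget_tokens keys read by _build_thinking_param above. A hedged sketch of how a caller might switch it on follows; whether LLMConfig accepts max_tokens and extra_params as constructor arguments is an assumption not shown in this diff.

# Illustrative sketch only; exercises the extra_params keys that _build_thinking_param reads.
from autobyteus.llm.models import LLMModel
from autobyteus.llm.utils.llm_config import LLMConfig
from autobyteus.llm.api.claude_llm import ClaudeLLM

config = LLMConfig(                        # constructor kwargs assumed, not shown in the diff
    max_tokens=8192,                       # overrides the 8192 default set in __init__
    extra_params={
        "thinking_enabled": True,          # turns on the Anthropic "thinking" request block
        "thinking_budget_tokens": 2048,    # coerced to int; falls back to 1024 if invalid
    },
)
llm = ClaudeLLM(model=LLMModel['claude-4.5-sonnet'], llm_config=config)
# When thinking is enabled the request omits temperature, matching the diff's comment
# that extended thinking is incompatible with temperature modifications.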
autobyteus/llm/api/gemini_llm.py
@@ -1,29 +1,41 @@
  import logging
- from typing import Dict, Optional, List, AsyncGenerator, Any
- from google import genai
+ import asyncio
+ from typing import Dict, List, AsyncGenerator, Any, Optional
  from google.genai import types as genai_types
- import os
  from autobyteus.llm.models import LLMModel
  from autobyteus.llm.base_llm import BaseLLM
  from autobyteus.llm.utils.llm_config import LLMConfig
  from autobyteus.llm.utils.messages import MessageRole, Message
  from autobyteus.llm.utils.token_usage import TokenUsage
  from autobyteus.llm.utils.response_types import CompleteResponse, ChunkResponse
- from autobyteus.llm.user_message import LLMUserMessage
+ from autobyteus.utils.gemini_helper import initialize_gemini_client_with_runtime
+ from autobyteus.utils.gemini_model_mapping import resolve_model_for_runtime
+ from autobyteus.llm.converters import convert_gemini_tool_calls
+ from autobyteus.llm.prompt_renderers.gemini_prompt_renderer import GeminiPromptRenderer

  logger = logging.getLogger(__name__)

- def _format_gemini_history(messages: List[Message]) -> List[Dict[str, Any]]:
- """Formats internal message history for the Gemini API."""
- history = []
- # System message is handled separately in the new API
- for msg in messages:
- if msg.role in [MessageRole.USER, MessageRole.ASSISTANT]:
- # NOTE: This history conversion will need to be updated for multimodal messages
- role = 'model' if msg.role == MessageRole.ASSISTANT else 'user'
- # The `parts` must be a list of dictionaries (Part objects), not a list of strings.
- history.append({"role": role, "parts": [{"text": msg.content}]})
- return history
+ def _split_gemini_parts(parts: List[Any]) -> tuple[str, str]:
+ """Split Gemini content parts into visible text and thought summaries."""
+ content_segments: List[str] = []
+ thought_segments: List[str] = []
+ for part in parts or []:
+ text = getattr(part, "text", None)
+ if not text:
+ continue
+ if getattr(part, "thought", False):
+ thought_segments.append(text)
+ else:
+ content_segments.append(text)
+ return "".join(content_segments), "".join(thought_segments)
+
+
+ def _split_system_message(messages: List[Message]) -> tuple[Optional[str], List[Message]]:
+ system_parts = [msg.content for msg in messages if msg.role == MessageRole.SYSTEM and msg.content]
+ system_prompt = "\n".join(system_parts) if system_parts else None
+ remaining = [msg for msg in messages if msg.role != MessageRole.SYSTEM]
+ return system_prompt, remaining
+

  class GeminiLLM(BaseLLM):
  def __init__(self, model: LLMModel = None, llm_config: LLMConfig = None):
@@ -32,59 +44,84 @@ class GeminiLLM(BaseLLM):
  }

  if model is None:
- model = LLMModel['gemini-2.5-flash']
+ # Default to the latest low-latency Gemini LLM.
+ model = LLMModel['gemini-3-flash-preview']
  if llm_config is None:
  llm_config = LLMConfig()

  super().__init__(model=model, llm_config=llm_config)
- self.client = self.initialize()
- self.async_client = self.client.aio
-
- @classmethod
- def initialize(cls) -> genai.client.Client:
- api_key = os.environ.get("GEMINI_API_KEY")
- if not api_key:
- logger.error("GEMINI_API_KEY environment variable is not set.")
- raise ValueError("GEMINI_API_KEY environment variable is not set.")
+
  try:
- return genai.Client()
+ self.client, self.runtime_info = initialize_gemini_client_with_runtime()
+ self.async_client = self.client.aio
+ self._renderer = GeminiPromptRenderer()
  except Exception as e:
- logger.error(f"Failed to initialize Gemini client: {str(e)}")
- raise ValueError(f"Failed to initialize Gemini client: {str(e)}")
+ # Re-raise or handle initialization errors specifically for the LLM context if needed
+ logger.error(f"Failed to initialize Gemini LLM: {str(e)}")
+ raise

- def _get_generation_config(self) -> genai_types.GenerateContentConfig:
+ def _get_generation_config(self, system_prompt: Optional[str] = None) -> genai_types.GenerateContentConfig:
  """Builds the generation config, handling special cases like 'thinking'."""
  config = self.generation_config_dict.copy()

- thinking_config = None
- if "flash" in self.model.value:
- thinking_config = genai_types.ThinkingConfig(thinking_budget=0)
+ # Map thinking_level to token budget
+ # Values based on Gemini 3 API recommendations
+ THINKING_LEVEL_BUDGETS = {
+ "minimal": 0,
+ "low": 1024,
+ "medium": 4096,
+ "high": 16384,
+ }

- # System instruction is now part of the config
- system_instruction = self.system_message if self.system_message else None
+ # Read thinking_level from extra_params (set by user config)
+ # Default to "minimal" (0 tokens) for backward compatibility
+ thinking_level = self.config.extra_params.get("thinking_level", "minimal")
+ thinking_budget = THINKING_LEVEL_BUDGETS.get(thinking_level, 0)

+ include_thoughts = self.config.extra_params.get("include_thoughts", False)
+ if not isinstance(include_thoughts, bool):
+ include_thoughts = False
+ thinking_config = genai_types.ThinkingConfig(
+ thinking_budget=thinking_budget,
+ include_thoughts=include_thoughts
+ )
+
+ # System instruction is now part of the config
+ system_instruction = system_prompt if system_prompt is not None else self.system_message
+
  return genai_types.GenerateContentConfig(
  **config,
  thinking_config=thinking_config,
  system_instruction=system_instruction
  )

- async def _send_user_message_to_llm(self, user_message: LLMUserMessage, **kwargs) -> CompleteResponse:
- self.add_user_message(user_message)
-
+ async def _send_messages_to_llm(self, messages: List[Message], **kwargs) -> CompleteResponse:
  try:
- history = _format_gemini_history(self.messages)
- generation_config = self._get_generation_config()
+ system_prompt, non_system = _split_system_message(messages)
+ history = await self._renderer.render(non_system)
+ generation_config = self._get_generation_config(system_prompt=system_prompt)

+ # FIX: Removed 'models/' prefix to support Vertex AI
+ runtime_adjusted_model = resolve_model_for_runtime(
+ self.model.value,
+ modality="llm",
+ runtime=getattr(self, "runtime_info", None) and self.runtime_info.runtime,
+ )
  response = await self.async_client.models.generate_content(
- model=f"models/{self.model.value}",
+ model=runtime_adjusted_model,
  contents=history,
  config=generation_config,
  )

- assistant_message = response.text
- self.add_assistant_message(assistant_message)
-
+ assistant_message = response.text or ""
+ reasoning_summary = None
+ if response.candidates and response.candidates[0].content and response.candidates[0].content.parts:
+ parsed_text, parsed_thoughts = _split_gemini_parts(response.candidates[0].content.parts)
+ if parsed_text:
+ assistant_message = parsed_text
+ if parsed_thoughts:
+ reasoning_summary = parsed_thoughts
+
  token_usage = TokenUsage(
  prompt_tokens=0,
  completion_tokens=0,
@@ -93,35 +130,102 @@ class GeminiLLM(BaseLLM):

  return CompleteResponse(
  content=assistant_message,
+ reasoning=reasoning_summary,
  usage=token_usage
  )
  except Exception as e:
  logger.error(f"Error in Gemini API call: {str(e)}")
  raise ValueError(f"Error in Gemini API call: {str(e)}")

- async def _stream_user_message_to_llm(self, user_message: LLMUserMessage, **kwargs) -> AsyncGenerator[ChunkResponse, None]:
- self.add_user_message(user_message)
+ async def _stream_messages_to_llm(self, messages: List[Message], **kwargs) -> AsyncGenerator[ChunkResponse, None]:
  complete_response = ""
+ complete_reasoning = ""
+
+ # Extract tools if provided
+ tools = kwargs.get("tools")

  try:
- history = _format_gemini_history(self.messages)
- generation_config = self._get_generation_config()
+ system_prompt, non_system = _split_system_message(messages)
+ history = await self._renderer.render(non_system)
+ generation_config = self._get_generation_config(system_prompt=system_prompt)
+
+ # Add tools to config if present
+ # Note: In google.genai, tools can be passed in config
+ if tools:
+ # Auto-wrap tools if they appear to be raw function declarations
+ if isinstance(tools, list) and len(tools) > 0:
+ first_tool = tools[0]
+ # Check if it's a raw declaration (dict with name/description) but NOT a wrapper (dict with function_declarations)
+ if isinstance(first_tool, dict):
+ is_declaration = "name" in first_tool and "description" in first_tool
+ is_wrapper = "function_declarations" in first_tool
+
+ if is_declaration and not is_wrapper:
+ # Wrap the list of declarations into a single Tool structure
+ tools = [{"function_declarations": tools}]

- response_stream = await self.async_client.models.generate_content_stream(
- model=f"models/{self.model.value}",
- contents=history,
- config=generation_config,
+ try:
+ generation_config.tools = tools
+ except Exception:
+ # Fallback or strict strict typing issues
+ pass
+
+ # FIX: Removed 'models/' prefix to support Vertex AI
+ runtime_adjusted_model = resolve_model_for_runtime(
+ self.model.value,
+ modality="llm",
+ runtime=getattr(self, "runtime_info", None) and self.runtime_info.runtime,
  )
+
+ # Prepare call args
+ call_kwargs = {
+ "model": runtime_adjusted_model,
+ "contents": history,
+ "config": generation_config,
+ }
+ # If explicit tools argument is needed and not supported in config for this SDK version:
+ # call_kwargs['tools'] = tools
+ # But usually config holds it.
+
+ response_stream = await self.async_client.models.generate_content_stream(**call_kwargs)

  async for chunk in response_stream:
- chunk_text = chunk.text
- complete_response += chunk_text
- yield ChunkResponse(
- content=chunk_text,
- is_complete=False
- )
-
- self.add_assistant_message(complete_response)
+ handled_parts = False
+ if chunk.candidates and chunk.candidates[0].content and chunk.candidates[0].content.parts:
+ handled_parts = True
+ for part in chunk.candidates[0].content.parts:
+ part_text = getattr(part, "text", None)
+ if part_text:
+ if getattr(part, "thought", False):
+ complete_reasoning += part_text
+ yield ChunkResponse(
+ content="",
+ reasoning=part_text,
+ is_complete=False
+ )
+ else:
+ complete_response += part_text
+ yield ChunkResponse(
+ content=part_text,
+ is_complete=False
+ )
+
+ tool_calls = convert_gemini_tool_calls(part)
+ if tool_calls:
+ yield ChunkResponse(
+ content="",
+ tool_calls=tool_calls,
+ is_complete=False
+ )
+
+ if not handled_parts:
+ chunk_text = chunk.text
+ if chunk_text:
+ complete_response += chunk_text
+ yield ChunkResponse(
+ content=chunk_text,
+ is_complete=False
+ )

  token_usage = TokenUsage(
  prompt_tokens=0,
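Note: the GeminiLLM rework exposes the same opt-in pattern through two extra_params keys read by _get_generation_config above: thinking_level (mapped to a token budget by THINKING_LEVEL_BUDGETS) and include_thoughts (whether thought summaries come back as reasoning chunks). A hedged sketch, again assuming LLMConfig takes extra_params in its constructor:

# Illustrative sketch only; the keys mirror what _get_generation_config reads above.
from autobyteus.llm.models import LLMModel
from autobyteus.llm.utils.llm_config import LLMConfig
from autobyteus.llm.api.gemini_llm import GeminiLLM

config = LLMConfig(                   # constructor kwargs assumed, not shown in the diff
    extra_params={
        "thinking_level": "medium",   # minimal=0, low=1024, medium=4096, high=16384 budget tokens
        "include_thoughts": True,     # surface thought summaries via ChunkResponse.reasoning
    },
)
llm = GeminiLLM(model=LLMModel['gemini-3-flash-preview'], llm_config=config)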
autobyteus/llm/api/grok_llm.py
@@ -10,7 +10,7 @@ class GrokLLM(OpenAICompatibleLLM):
  def __init__(self, model: LLMModel = None, llm_config: LLMConfig = None):
  # Provide defaults if not specified
  if model is None:
- model = LLMModel['grok-2-1212']
+ model = LLMModel['grok-4-1-fast-reasoning']
  if llm_config is None:
  llm_config = LLMConfig()