PyPI - autobyteus - Versions diffs - 1.2.1__py3-none-any.whl → 1.2.3__py3-none-any.whl - Mend

autobyteus-1.2.1-py3-none-any.whl → autobyteus-1.2.3-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (466)

autobyteus/agent/agent.py +15 -5
autobyteus/agent/bootstrap_steps/__init__.py +1 -3
autobyteus/agent/bootstrap_steps/agent_bootstrapper.py +3 -59
autobyteus/agent/bootstrap_steps/base_bootstrap_step.py +1 -4
autobyteus/agent/bootstrap_steps/mcp_server_prewarming_step.py +1 -3
autobyteus/agent/bootstrap_steps/system_prompt_processing_step.py +16 -13
autobyteus/agent/bootstrap_steps/workspace_context_initialization_step.py +2 -4
autobyteus/agent/context/agent_config.py +43 -20
autobyteus/agent/context/agent_context.py +23 -18
autobyteus/agent/context/agent_runtime_state.py +19 -19
autobyteus/agent/events/__init__.py +16 -1
autobyteus/agent/events/agent_events.py +43 -3
autobyteus/agent/events/agent_input_event_queue_manager.py +79 -26
autobyteus/agent/events/event_store.py +57 -0
autobyteus/agent/events/notifiers.py +69 -59
autobyteus/agent/events/worker_event_dispatcher.py +21 -64
autobyteus/agent/factory/agent_factory.py +52 -0
autobyteus/agent/handlers/__init__.py +2 -0
autobyteus/agent/handlers/approved_tool_invocation_event_handler.py +51 -34
autobyteus/agent/handlers/bootstrap_event_handler.py +155 -0
autobyteus/agent/handlers/inter_agent_message_event_handler.py +10 -0
autobyteus/agent/handlers/lifecycle_event_logger.py +19 -11
autobyteus/agent/handlers/llm_complete_response_received_event_handler.py +10 -15
autobyteus/agent/handlers/llm_user_message_ready_event_handler.py +188 -48
autobyteus/agent/handlers/tool_execution_approval_event_handler.py +0 -10
autobyteus/agent/handlers/tool_invocation_request_event_handler.py +53 -48
autobyteus/agent/handlers/tool_result_event_handler.py +7 -8
autobyteus/agent/handlers/user_input_message_event_handler.py +10 -3
autobyteus/agent/input_processor/memory_ingest_input_processor.py +40 -0
autobyteus/agent/lifecycle/__init__.py +12 -0
autobyteus/agent/lifecycle/base_processor.py +109 -0
autobyteus/agent/lifecycle/events.py +35 -0
autobyteus/agent/lifecycle/processor_definition.py +36 -0
autobyteus/agent/lifecycle/processor_registry.py +106 -0
autobyteus/agent/llm_request_assembler.py +98 -0
autobyteus/agent/llm_response_processor/__init__.py +1 -8
autobyteus/agent/message/context_file_type.py +1 -1
autobyteus/agent/runtime/agent_runtime.py +29 -21
autobyteus/agent/runtime/agent_worker.py +98 -19
autobyteus/agent/shutdown_steps/__init__.py +2 -0
autobyteus/agent/shutdown_steps/agent_shutdown_orchestrator.py +2 -0
autobyteus/agent/shutdown_steps/tool_cleanup_step.py +58 -0
autobyteus/agent/status/__init__.py +14 -0
autobyteus/agent/status/manager.py +93 -0
autobyteus/agent/status/status_deriver.py +96 -0
autobyteus/agent/{phases/phase_enum.py → status/status_enum.py} +16 -16
autobyteus/agent/status/status_update_utils.py +73 -0
autobyteus/agent/streaming/__init__.py +52 -5
autobyteus/agent/streaming/adapters/__init__.py +18 -0
autobyteus/agent/streaming/adapters/invocation_adapter.py +184 -0
autobyteus/agent/streaming/adapters/tool_call_parsing.py +163 -0
autobyteus/agent/streaming/adapters/tool_syntax_registry.py +67 -0
autobyteus/agent/streaming/agent_event_stream.py +3 -183
autobyteus/agent/streaming/api_tool_call/__init__.py +16 -0
autobyteus/agent/streaming/api_tool_call/file_content_streamer.py +56 -0
autobyteus/agent/streaming/api_tool_call/json_string_field_extractor.py +175 -0
autobyteus/agent/streaming/api_tool_call_streaming_response_handler.py +4 -0
autobyteus/agent/streaming/events/__init__.py +6 -0
autobyteus/agent/streaming/events/stream_event_payloads.py +284 -0
autobyteus/agent/streaming/events/stream_events.py +141 -0
autobyteus/agent/streaming/handlers/__init__.py +15 -0
autobyteus/agent/streaming/handlers/api_tool_call_streaming_response_handler.py +303 -0
autobyteus/agent/streaming/handlers/parsing_streaming_response_handler.py +107 -0
autobyteus/agent/streaming/handlers/pass_through_streaming_response_handler.py +107 -0
autobyteus/agent/streaming/handlers/streaming_handler_factory.py +177 -0
autobyteus/agent/streaming/handlers/streaming_response_handler.py +58 -0
autobyteus/agent/streaming/parser/__init__.py +61 -0
autobyteus/agent/streaming/parser/event_emitter.py +181 -0
autobyteus/agent/streaming/parser/events.py +4 -0
autobyteus/agent/streaming/parser/invocation_adapter.py +4 -0
autobyteus/agent/streaming/parser/json_parsing_strategies/__init__.py +19 -0
autobyteus/agent/streaming/parser/json_parsing_strategies/base.py +32 -0
autobyteus/agent/streaming/parser/json_parsing_strategies/default.py +34 -0
autobyteus/agent/streaming/parser/json_parsing_strategies/gemini.py +31 -0
autobyteus/agent/streaming/parser/json_parsing_strategies/openai.py +64 -0
autobyteus/agent/streaming/parser/json_parsing_strategies/registry.py +75 -0
autobyteus/agent/streaming/parser/parser_context.py +227 -0
autobyteus/agent/streaming/parser/parser_factory.py +132 -0
autobyteus/agent/streaming/parser/sentinel_format.py +7 -0
autobyteus/agent/streaming/parser/state_factory.py +62 -0
autobyteus/agent/streaming/parser/states/__init__.py +1 -0
autobyteus/agent/streaming/parser/states/base_state.py +60 -0
autobyteus/agent/streaming/parser/states/custom_xml_tag_run_bash_parsing_state.py +38 -0
autobyteus/agent/streaming/parser/states/custom_xml_tag_write_file_parsing_state.py +55 -0
autobyteus/agent/streaming/parser/states/delimited_content_state.py +146 -0
autobyteus/agent/streaming/parser/states/json_initialization_state.py +144 -0
autobyteus/agent/streaming/parser/states/json_tool_parsing_state.py +137 -0
autobyteus/agent/streaming/parser/states/sentinel_content_state.py +30 -0
autobyteus/agent/streaming/parser/states/sentinel_initialization_state.py +117 -0
autobyteus/agent/streaming/parser/states/text_state.py +78 -0
autobyteus/agent/streaming/parser/states/xml_patch_file_tool_parsing_state.py +328 -0
autobyteus/agent/streaming/parser/states/xml_run_bash_tool_parsing_state.py +129 -0
autobyteus/agent/streaming/parser/states/xml_tag_initialization_state.py +151 -0
autobyteus/agent/streaming/parser/states/xml_tool_parsing_state.py +63 -0
autobyteus/agent/streaming/parser/states/xml_write_file_tool_parsing_state.py +343 -0
autobyteus/agent/streaming/parser/strategies/__init__.py +17 -0
autobyteus/agent/streaming/parser/strategies/base.py +24 -0
autobyteus/agent/streaming/parser/strategies/json_tool_strategy.py +26 -0
autobyteus/agent/streaming/parser/strategies/registry.py +28 -0
autobyteus/agent/streaming/parser/strategies/sentinel_strategy.py +23 -0
autobyteus/agent/streaming/parser/strategies/xml_tag_strategy.py +21 -0
autobyteus/agent/streaming/parser/stream_scanner.py +167 -0
autobyteus/agent/streaming/parser/streaming_parser.py +212 -0
autobyteus/agent/streaming/parser/tool_call_parsing.py +4 -0
autobyteus/agent/streaming/parser/tool_constants.py +7 -0
autobyteus/agent/streaming/parser/tool_syntax_registry.py +4 -0
autobyteus/agent/streaming/parser/xml_tool_parsing_state_registry.py +55 -0
autobyteus/agent/streaming/parsing_streaming_response_handler.py +4 -0
autobyteus/agent/streaming/pass_through_streaming_response_handler.py +4 -0
autobyteus/agent/streaming/queue_streamer.py +3 -57
autobyteus/agent/streaming/segments/__init__.py +5 -0
autobyteus/agent/streaming/segments/segment_events.py +81 -0
autobyteus/agent/streaming/stream_event_payloads.py +2 -223
autobyteus/agent/streaming/stream_events.py +3 -140
autobyteus/agent/streaming/streaming_handler_factory.py +4 -0
autobyteus/agent/streaming/streaming_response_handler.py +4 -0
autobyteus/agent/streaming/streams/__init__.py +5 -0
autobyteus/agent/streaming/streams/agent_event_stream.py +197 -0
autobyteus/agent/streaming/utils/__init__.py +5 -0
autobyteus/agent/streaming/utils/queue_streamer.py +59 -0
autobyteus/agent/system_prompt_processor/__init__.py +2 -0
autobyteus/agent/system_prompt_processor/available_skills_processor.py +96 -0
autobyteus/agent/system_prompt_processor/base_processor.py +1 -1
autobyteus/agent/system_prompt_processor/processor_meta.py +15 -2
autobyteus/agent/system_prompt_processor/tool_manifest_injector_processor.py +39 -58
autobyteus/agent/token_budget.py +56 -0
autobyteus/agent/tool_execution_result_processor/memory_ingest_tool_result_processor.py +29 -0
autobyteus/agent/tool_invocation.py +16 -40
autobyteus/agent/tool_invocation_preprocessor/__init__.py +9 -0
autobyteus/agent/tool_invocation_preprocessor/base_preprocessor.py +45 -0
autobyteus/agent/tool_invocation_preprocessor/processor_definition.py +15 -0
autobyteus/agent/tool_invocation_preprocessor/processor_meta.py +33 -0
autobyteus/agent/tool_invocation_preprocessor/processor_registry.py +60 -0
autobyteus/agent/utils/wait_for_idle.py +12 -14
autobyteus/agent/workspace/base_workspace.py +6 -27
autobyteus/agent_team/agent_team.py +3 -3
autobyteus/agent_team/agent_team_builder.py +1 -41
autobyteus/agent_team/bootstrap_steps/__init__.py +0 -4
autobyteus/agent_team/bootstrap_steps/agent_configuration_preparation_step.py +8 -18
autobyteus/agent_team/bootstrap_steps/agent_team_bootstrapper.py +4 -16
autobyteus/agent_team/bootstrap_steps/base_agent_team_bootstrap_step.py +1 -2
autobyteus/agent_team/bootstrap_steps/coordinator_initialization_step.py +1 -2
autobyteus/agent_team/bootstrap_steps/task_notifier_initialization_step.py +1 -2
autobyteus/agent_team/bootstrap_steps/team_context_initialization_step.py +4 -4
autobyteus/agent_team/context/agent_team_config.py +6 -3
autobyteus/agent_team/context/agent_team_context.py +25 -3
autobyteus/agent_team/context/agent_team_runtime_state.py +9 -6
autobyteus/agent_team/events/__init__.py +11 -0
autobyteus/agent_team/events/agent_team_event_dispatcher.py +22 -9
autobyteus/agent_team/events/agent_team_events.py +16 -0
autobyteus/agent_team/events/event_store.py +57 -0
autobyteus/agent_team/factory/agent_team_factory.py +8 -0
autobyteus/agent_team/handlers/inter_agent_message_request_event_handler.py +18 -2
autobyteus/agent_team/handlers/lifecycle_agent_team_event_handler.py +21 -5
autobyteus/agent_team/handlers/process_user_message_event_handler.py +17 -8
autobyteus/agent_team/handlers/tool_approval_team_event_handler.py +19 -4
autobyteus/agent_team/runtime/agent_team_runtime.py +41 -10
autobyteus/agent_team/runtime/agent_team_worker.py +69 -5
autobyteus/agent_team/status/__init__.py +14 -0
autobyteus/agent_team/status/agent_team_status.py +18 -0
autobyteus/agent_team/status/agent_team_status_manager.py +33 -0
autobyteus/agent_team/status/status_deriver.py +62 -0
autobyteus/agent_team/status/status_update_utils.py +42 -0
autobyteus/agent_team/streaming/__init__.py +2 -2
autobyteus/agent_team/streaming/agent_team_event_notifier.py +6 -6
autobyteus/agent_team/streaming/agent_team_stream_event_payloads.py +4 -4
autobyteus/agent_team/streaming/agent_team_stream_events.py +3 -3
autobyteus/agent_team/system_prompt_processor/__init__.py +6 -0
autobyteus/agent_team/system_prompt_processor/team_manifest_injector_processor.py +76 -0
autobyteus/agent_team/task_notification/task_notification_mode.py +19 -0
autobyteus/agent_team/utils/wait_for_idle.py +4 -4
autobyteus/cli/agent_cli.py +18 -10
autobyteus/cli/agent_team_tui/app.py +14 -11
autobyteus/cli/agent_team_tui/state.py +13 -15
autobyteus/cli/agent_team_tui/widgets/agent_list_sidebar.py +15 -15
autobyteus/cli/agent_team_tui/widgets/focus_pane.py +143 -36
autobyteus/cli/agent_team_tui/widgets/renderables.py +1 -1
autobyteus/cli/agent_team_tui/widgets/shared.py +25 -25
autobyteus/cli/cli_display.py +193 -44
autobyteus/cli/workflow_tui/app.py +9 -10
autobyteus/cli/workflow_tui/state.py +14 -16
autobyteus/cli/workflow_tui/widgets/agent_list_sidebar.py +15 -15
autobyteus/cli/workflow_tui/widgets/focus_pane.py +137 -35
autobyteus/cli/workflow_tui/widgets/renderables.py +1 -1
autobyteus/cli/workflow_tui/widgets/shared.py +25 -25
autobyteus/clients/autobyteus_client.py +94 -1
autobyteus/events/event_types.py +11 -18
autobyteus/llm/api/autobyteus_llm.py +33 -29
autobyteus/llm/api/claude_llm.py +142 -36
autobyteus/llm/api/gemini_llm.py +163 -59
autobyteus/llm/api/grok_llm.py +1 -1
autobyteus/llm/api/minimax_llm.py +26 -0
autobyteus/llm/api/mistral_llm.py +113 -87
autobyteus/llm/api/ollama_llm.py +9 -42
autobyteus/llm/api/openai_compatible_llm.py +127 -91
autobyteus/llm/api/openai_llm.py +3 -3
autobyteus/llm/api/openai_responses_llm.py +324 -0
autobyteus/llm/api/zhipu_llm.py +21 -2
autobyteus/llm/autobyteus_provider.py +70 -60
autobyteus/llm/base_llm.py +85 -81
autobyteus/llm/converters/__init__.py +14 -0
autobyteus/llm/converters/anthropic_tool_call_converter.py +37 -0
autobyteus/llm/converters/gemini_tool_call_converter.py +57 -0
autobyteus/llm/converters/mistral_tool_call_converter.py +37 -0
autobyteus/llm/converters/openai_tool_call_converter.py +38 -0
autobyteus/llm/extensions/base_extension.py +6 -12
autobyteus/llm/extensions/token_usage_tracking_extension.py +45 -18
autobyteus/llm/llm_factory.py +282 -204
autobyteus/llm/lmstudio_provider.py +60 -49
autobyteus/llm/models.py +35 -2
autobyteus/llm/ollama_provider.py +60 -49
autobyteus/llm/ollama_provider_resolver.py +0 -1
autobyteus/llm/prompt_renderers/__init__.py +19 -0
autobyteus/llm/prompt_renderers/anthropic_prompt_renderer.py +104 -0
autobyteus/llm/prompt_renderers/autobyteus_prompt_renderer.py +19 -0
autobyteus/llm/prompt_renderers/base_prompt_renderer.py +10 -0
autobyteus/llm/prompt_renderers/gemini_prompt_renderer.py +63 -0
autobyteus/llm/prompt_renderers/mistral_prompt_renderer.py +87 -0
autobyteus/llm/prompt_renderers/ollama_prompt_renderer.py +51 -0
autobyteus/llm/prompt_renderers/openai_chat_renderer.py +97 -0
autobyteus/llm/prompt_renderers/openai_responses_renderer.py +101 -0
autobyteus/llm/providers.py +1 -3
autobyteus/llm/token_counter/claude_token_counter.py +56 -25
autobyteus/llm/token_counter/mistral_token_counter.py +12 -8
autobyteus/llm/token_counter/openai_token_counter.py +24 -5
autobyteus/llm/token_counter/token_counter_factory.py +12 -5
autobyteus/llm/utils/llm_config.py +6 -12
autobyteus/llm/utils/media_payload_formatter.py +27 -20
autobyteus/llm/utils/messages.py +55 -3
autobyteus/llm/utils/response_types.py +3 -0
autobyteus/llm/utils/tool_call_delta.py +31 -0
autobyteus/memory/__init__.py +32 -0
autobyteus/memory/active_transcript.py +69 -0
autobyteus/memory/compaction/__init__.py +9 -0
autobyteus/memory/compaction/compaction_result.py +8 -0
autobyteus/memory/compaction/compactor.py +89 -0
autobyteus/memory/compaction/summarizer.py +11 -0
autobyteus/memory/compaction_snapshot_builder.py +84 -0
autobyteus/memory/memory_manager.py +183 -0
autobyteus/memory/models/__init__.py +14 -0
autobyteus/memory/models/episodic_item.py +41 -0
autobyteus/memory/models/memory_types.py +7 -0
autobyteus/memory/models/raw_trace_item.py +79 -0
autobyteus/memory/models/semantic_item.py +41 -0
autobyteus/memory/models/tool_interaction.py +20 -0
autobyteus/memory/policies/__init__.py +5 -0
autobyteus/memory/policies/compaction_policy.py +16 -0
autobyteus/memory/retrieval/__init__.py +7 -0
autobyteus/memory/retrieval/memory_bundle.py +11 -0
autobyteus/memory/retrieval/retriever.py +13 -0
autobyteus/memory/store/__init__.py +7 -0
autobyteus/memory/store/base_store.py +14 -0
autobyteus/memory/store/file_store.py +98 -0
autobyteus/memory/tool_interaction_builder.py +46 -0
autobyteus/memory/turn_tracker.py +9 -0
autobyteus/multimedia/audio/api/autobyteus_audio_client.py +19 -5
autobyteus/multimedia/audio/api/gemini_audio_client.py +108 -16
autobyteus/multimedia/audio/audio_client_factory.py +47 -9
autobyteus/multimedia/audio/audio_model.py +2 -1
autobyteus/multimedia/image/api/autobyteus_image_client.py +19 -5
autobyteus/multimedia/image/api/gemini_image_client.py +38 -17
autobyteus/multimedia/image/api/openai_image_client.py +125 -43
autobyteus/multimedia/image/autobyteus_image_provider.py +2 -1
autobyteus/multimedia/image/image_client_factory.py +47 -15
autobyteus/multimedia/image/image_model.py +5 -2
autobyteus/multimedia/providers.py +3 -2
autobyteus/skills/loader.py +71 -0
autobyteus/skills/model.py +11 -0
autobyteus/skills/registry.py +70 -0
autobyteus/task_management/tools/todo_tools/add_todo.py +2 -2
autobyteus/task_management/tools/todo_tools/create_todo_list.py +2 -2
autobyteus/task_management/tools/todo_tools/update_todo_status.py +2 -2
autobyteus/tools/__init__.py +34 -47
autobyteus/tools/base_tool.py +7 -0
autobyteus/tools/file/__init__.py +2 -6
autobyteus/tools/file/patch_file.py +149 -0
autobyteus/tools/file/read_file.py +36 -5
autobyteus/tools/file/write_file.py +4 -1
autobyteus/tools/functional_tool.py +43 -6
autobyteus/tools/mcp/__init__.py +2 -0
autobyteus/tools/mcp/config_service.py +5 -1
autobyteus/tools/mcp/server/__init__.py +2 -0
autobyteus/tools/mcp/server/http_managed_mcp_server.py +1 -1
autobyteus/tools/mcp/server/websocket_managed_mcp_server.py +141 -0
autobyteus/tools/mcp/server_instance_manager.py +8 -1
autobyteus/tools/mcp/types.py +61 -0
autobyteus/tools/multimedia/audio_tools.py +70 -17
autobyteus/tools/multimedia/download_media_tool.py +18 -4
autobyteus/tools/multimedia/image_tools.py +246 -62
autobyteus/tools/operation_executor/journal_manager.py +107 -0
autobyteus/tools/operation_executor/operation_event_buffer.py +57 -0
autobyteus/tools/operation_executor/operation_event_producer.py +29 -0
autobyteus/tools/operation_executor/operation_executor.py +58 -0
autobyteus/tools/registry/tool_definition.py +43 -2
autobyteus/tools/skill/load_skill.py +50 -0
autobyteus/tools/terminal/__init__.py +45 -0
autobyteus/tools/terminal/ansi_utils.py +32 -0
autobyteus/tools/terminal/background_process_manager.py +233 -0
autobyteus/tools/terminal/output_buffer.py +105 -0
autobyteus/tools/terminal/prompt_detector.py +63 -0
autobyteus/tools/terminal/pty_session.py +241 -0
autobyteus/tools/terminal/session_factory.py +20 -0
autobyteus/tools/terminal/terminal_session_manager.py +226 -0
autobyteus/tools/terminal/tools/__init__.py +13 -0
autobyteus/tools/terminal/tools/get_process_output.py +81 -0
autobyteus/tools/terminal/tools/run_bash.py +109 -0
autobyteus/tools/terminal/tools/start_background_process.py +104 -0
autobyteus/tools/terminal/tools/stop_background_process.py +67 -0
autobyteus/tools/terminal/types.py +54 -0
autobyteus/tools/terminal/wsl_tmux_session.py +221 -0
autobyteus/tools/terminal/wsl_utils.py +156 -0
autobyteus/tools/transaction_management/backup_handler.py +48 -0
autobyteus/tools/transaction_management/operation_lifecycle_manager.py +62 -0
autobyteus/tools/usage/__init__.py +1 -2
autobyteus/tools/usage/formatters/__init__.py +17 -1
autobyteus/tools/usage/formatters/base_formatter.py +8 -0
autobyteus/tools/usage/formatters/default_xml_schema_formatter.py +2 -2
autobyteus/tools/usage/formatters/mistral_json_schema_formatter.py +18 -0
autobyteus/tools/usage/formatters/patch_file_xml_example_formatter.py +64 -0
autobyteus/tools/usage/formatters/patch_file_xml_schema_formatter.py +31 -0
autobyteus/tools/usage/formatters/run_bash_xml_example_formatter.py +32 -0
autobyteus/tools/usage/formatters/run_bash_xml_schema_formatter.py +36 -0
autobyteus/tools/usage/formatters/write_file_xml_example_formatter.py +53 -0
autobyteus/tools/usage/formatters/write_file_xml_schema_formatter.py +31 -0
autobyteus/tools/usage/providers/tool_manifest_provider.py +10 -10
autobyteus/tools/usage/registries/__init__.py +1 -3
autobyteus/tools/usage/registries/tool_formatting_registry.py +115 -8
autobyteus/tools/usage/tool_schema_provider.py +51 -0
autobyteus/tools/web/__init__.py +4 -0
autobyteus/tools/web/read_url_tool.py +80 -0
autobyteus/utils/diff_utils.py +271 -0
autobyteus/utils/download_utils.py +109 -0
autobyteus/utils/file_utils.py +57 -2
autobyteus/utils/gemini_helper.py +56 -0
autobyteus/utils/gemini_model_mapping.py +71 -0
autobyteus/utils/llm_output_formatter.py +75 -0
autobyteus/utils/tool_call_format.py +36 -0
autobyteus/workflow/agentic_workflow.py +3 -3
autobyteus/workflow/bootstrap_steps/agent_tool_injection_step.py +2 -2
autobyteus/workflow/bootstrap_steps/base_workflow_bootstrap_step.py +2 -2
autobyteus/workflow/bootstrap_steps/coordinator_initialization_step.py +2 -2
autobyteus/workflow/bootstrap_steps/coordinator_prompt_preparation_step.py +3 -9
autobyteus/workflow/bootstrap_steps/workflow_bootstrapper.py +6 -6
autobyteus/workflow/bootstrap_steps/workflow_runtime_queue_initialization_step.py +2 -2
autobyteus/workflow/context/workflow_context.py +3 -3
autobyteus/workflow/context/workflow_runtime_state.py +5 -5
autobyteus/workflow/events/workflow_event_dispatcher.py +5 -5
autobyteus/workflow/handlers/lifecycle_workflow_event_handler.py +3 -3
autobyteus/workflow/handlers/process_user_message_event_handler.py +5 -5
autobyteus/workflow/handlers/tool_approval_workflow_event_handler.py +2 -2
autobyteus/workflow/runtime/workflow_runtime.py +8 -8
autobyteus/workflow/runtime/workflow_worker.py +3 -3
autobyteus/workflow/status/__init__.py +11 -0
autobyteus/workflow/status/workflow_status.py +19 -0
autobyteus/workflow/status/workflow_status_manager.py +48 -0
autobyteus/workflow/streaming/__init__.py +2 -2
autobyteus/workflow/streaming/workflow_event_notifier.py +7 -7
autobyteus/workflow/streaming/workflow_stream_event_payloads.py +4 -4
autobyteus/workflow/streaming/workflow_stream_events.py +3 -3
autobyteus/workflow/utils/wait_for_idle.py +4 -4
autobyteus-1.2.3.dist-info/METADATA +293 -0
autobyteus-1.2.3.dist-info/RECORD +600 -0
{autobyteus-1.2.1.dist-info → autobyteus-1.2.3.dist-info}/WHEEL +1 -1
{autobyteus-1.2.1.dist-info → autobyteus-1.2.3.dist-info}/top_level.txt +0 -1
autobyteus/agent/bootstrap_steps/agent_runtime_queue_initialization_step.py +0 -57
autobyteus/agent/hooks/__init__.py +0 -16
autobyteus/agent/hooks/base_phase_hook.py +0 -78
autobyteus/agent/hooks/hook_definition.py +0 -36
autobyteus/agent/hooks/hook_meta.py +0 -37
autobyteus/agent/hooks/hook_registry.py +0 -106
autobyteus/agent/llm_response_processor/provider_aware_tool_usage_processor.py +0 -103
autobyteus/agent/phases/__init__.py +0 -18
autobyteus/agent/phases/discover.py +0 -53
autobyteus/agent/phases/manager.py +0 -265
autobyteus/agent/phases/transition_decorator.py +0 -40
autobyteus/agent/phases/transition_info.py +0 -33
autobyteus/agent/remote_agent.py +0 -244
autobyteus/agent/workspace/workspace_definition.py +0 -36
autobyteus/agent/workspace/workspace_meta.py +0 -37
autobyteus/agent/workspace/workspace_registry.py +0 -72
autobyteus/agent_team/bootstrap_steps/agent_team_runtime_queue_initialization_step.py +0 -25
autobyteus/agent_team/bootstrap_steps/coordinator_prompt_preparation_step.py +0 -85
autobyteus/agent_team/phases/__init__.py +0 -11
autobyteus/agent_team/phases/agent_team_operational_phase.py +0 -19
autobyteus/agent_team/phases/agent_team_phase_manager.py +0 -48
autobyteus/llm/api/bedrock_llm.py +0 -92
autobyteus/llm/api/groq_llm.py +0 -94
autobyteus/llm/api/nvidia_llm.py +0 -108
autobyteus/llm/utils/token_pricing_config.py +0 -87
autobyteus/rpc/__init__.py +0 -73
autobyteus/rpc/client/__init__.py +0 -17
autobyteus/rpc/client/abstract_client_connection.py +0 -124
autobyteus/rpc/client/client_connection_manager.py +0 -153
autobyteus/rpc/client/sse_client_connection.py +0 -306
autobyteus/rpc/client/stdio_client_connection.py +0 -280
autobyteus/rpc/config/__init__.py +0 -13
autobyteus/rpc/config/agent_server_config.py +0 -153
autobyteus/rpc/config/agent_server_registry.py +0 -152
autobyteus/rpc/hosting.py +0 -244
autobyteus/rpc/protocol.py +0 -244
autobyteus/rpc/server/__init__.py +0 -20
autobyteus/rpc/server/agent_server_endpoint.py +0 -181
autobyteus/rpc/server/base_method_handler.py +0 -40
autobyteus/rpc/server/method_handlers.py +0 -259
autobyteus/rpc/server/sse_server_handler.py +0 -182
autobyteus/rpc/server/stdio_server_handler.py +0 -151
autobyteus/rpc/server_main.py +0 -198
autobyteus/rpc/transport_type.py +0 -13
autobyteus/tools/bash/__init__.py +0 -2
autobyteus/tools/bash/bash_executor.py +0 -100
autobyteus/tools/browser/__init__.py +0 -2
autobyteus/tools/browser/session_aware/browser_session_aware_navigate_to.py +0 -75
autobyteus/tools/browser/session_aware/browser_session_aware_tool.py +0 -30
autobyteus/tools/browser/session_aware/browser_session_aware_web_element_trigger.py +0 -154
autobyteus/tools/browser/session_aware/browser_session_aware_webpage_reader.py +0 -89
autobyteus/tools/browser/session_aware/browser_session_aware_webpage_screenshot_taker.py +0 -107
autobyteus/tools/browser/session_aware/factory/browser_session_aware_web_element_trigger_factory.py +0 -14
autobyteus/tools/browser/session_aware/factory/browser_session_aware_webpage_reader_factory.py +0 -26
autobyteus/tools/browser/session_aware/factory/browser_session_aware_webpage_screenshot_taker_factory.py +0 -14
autobyteus/tools/browser/session_aware/shared_browser_session.py +0 -11
autobyteus/tools/browser/session_aware/shared_browser_session_manager.py +0 -25
autobyteus/tools/browser/session_aware/web_element_action.py +0 -20
autobyteus/tools/browser/standalone/__init__.py +0 -6
autobyteus/tools/browser/standalone/factory/__init__.py +0 -0
autobyteus/tools/browser/standalone/factory/webpage_reader_factory.py +0 -25
autobyteus/tools/browser/standalone/factory/webpage_screenshot_taker_factory.py +0 -14
autobyteus/tools/browser/standalone/navigate_to.py +0 -84
autobyteus/tools/browser/standalone/web_page_pdf_generator.py +0 -101
autobyteus/tools/browser/standalone/webpage_image_downloader.py +0 -169
autobyteus/tools/browser/standalone/webpage_reader.py +0 -105
autobyteus/tools/browser/standalone/webpage_screenshot_taker.py +0 -105
autobyteus/tools/file/edit_file.py +0 -200
autobyteus/tools/file/list_directory.py +0 -168
autobyteus/tools/file/search_files.py +0 -188
autobyteus/tools/timer.py +0 -175
autobyteus/tools/usage/parsers/__init__.py +0 -22
autobyteus/tools/usage/parsers/_json_extractor.py +0 -99
autobyteus/tools/usage/parsers/_string_decoders.py +0 -18
autobyteus/tools/usage/parsers/anthropic_xml_tool_usage_parser.py +0 -10
autobyteus/tools/usage/parsers/base_parser.py +0 -41
autobyteus/tools/usage/parsers/default_json_tool_usage_parser.py +0 -83
autobyteus/tools/usage/parsers/default_xml_tool_usage_parser.py +0 -316
autobyteus/tools/usage/parsers/exceptions.py +0 -13
autobyteus/tools/usage/parsers/gemini_json_tool_usage_parser.py +0 -77
autobyteus/tools/usage/parsers/openai_json_tool_usage_parser.py +0 -149
autobyteus/tools/usage/parsers/provider_aware_tool_usage_parser.py +0 -59
autobyteus/tools/usage/registries/tool_usage_parser_registry.py +0 -62
autobyteus/workflow/phases/__init__.py +0 -11
autobyteus/workflow/phases/workflow_operational_phase.py +0 -19
autobyteus/workflow/phases/workflow_phase_manager.py +0 -48
autobyteus-1.2.1.dist-info/METADATA +0 -205
autobyteus-1.2.1.dist-info/RECORD +0 -511
examples/__init__.py +0 -1
examples/agent_team/__init__.py +0 -1
examples/discover_phase_transitions.py +0 -104
examples/run_agentic_software_engineer.py +0 -239
examples/run_browser_agent.py +0 -262
examples/run_google_slides_agent.py +0 -287
examples/run_mcp_browser_client.py +0 -174
examples/run_mcp_google_slides_client.py +0 -270
examples/run_mcp_list_tools.py +0 -189
examples/run_poem_writer.py +0 -284
examples/run_sqlite_agent.py +0 -295
/autobyteus/{tools/browser/session_aware → skills}/__init__.py +0 -0
/autobyteus/tools/{browser/session_aware/factory → skill}/__init__.py +0 -0
{autobyteus-1.2.1.dist-info → autobyteus-1.2.3.dist-info}/licenses/LICENSE +0 -0

autobyteus/multimedia/audio/audio_client_factory.py CHANGED Viewed

@@ -13,13 +13,51 @@ from autobyteus.utils.parameter_schema import ParameterSchema, ParameterDefiniti
 logger = logging.getLogger(__name__)
-GEMINI_TTS_VOICES = [
-    "Zephyr", "Puck", "Charon", "Kore", "Fenrir", "Leda", "Orus", "Aoede",
-    "Callirrhoe", "Autonoe", "Enceladus", "Iapetus", "Umbriel", "Algieba",
-    "Despina", "Erinome", "Algenib", "Rasalgethi", "Laomedeia", "Achernar",
-    "Alnilam", "Schedar", "Gacrux", "Pulcherrima", "Achird", "Zubenelgenubi",
-    "Vindemiatrix", "Sadachbia", "Sadaltager", "Sulafat"
+# Enhanced metadata for Google Gemini TTS voices, including gender and description.
+GEMINI_VOICE_DETAILS = {
+    "Zephyr": {"gender": "female", "description": "Bright, Higher pitch"},
+    "Puck": {"gender": "male", "description": "Upbeat, Middle pitch"},
+    "Charon": {"gender": "male", "description": "Informative, Lower pitch"},
+    "Kore": {"gender": "female", "description": "Firm, Middle pitch"},
+    "Fenrir": {"gender": "male", "description": "Excitable, Lower middle pitch"},
+    "Leda": {"gender": "female", "description": "Youthful, Higher pitch"},
+    "Orus": {"gender": "male", "description": "Firm, Lower middle pitch"},
+    "Aoede": {"gender": "female", "description": "Breezy, Middle pitch"},
+    "Callirrhoe": {"gender": "female", "description": "Easy-going, Middle pitch"},
+    "Autonoe": {"gender": "female", "description": "Bright, Middle pitch"},
+    "Enceladus": {"gender": "male", "description": "Breathy, Lower pitch"},
+    "Iapetus": {"gender": "male", "description": "Clear, Lower middle pitch"},
+    "Umbriel": {"gender": "male", "description": "Easy-going, Lower middle pitch"},
+    "Algieba": {"gender": "male", "description": "Smooth, Lower pitch"},
+    "Despina": {"gender": "female", "description": "Smooth, Middle pitch"},
+    "Erinome": {"gender": "female", "description": "Clear, Middle pitch"},
+    "Algenib": {"gender": "male", "description": "Gravelly, Lower pitch"},
+    "Rasalgethi": {"gender": "male", "description": "Informative, Middle pitch"},
+    "Laomedeia": {"gender": "female", "description": "Upbeat, Higher pitch"},
+    "Achernar": {"gender": "female", "description": "Soft, Higher pitch"},
+    "Alnilam": {"gender": "male", "description": "Firm, Lower middle pitch"},
+    "Schedar": {"gender": "male", "description": "Even, Lower middle pitch"},
+    "Gacrux": {"gender": "female", "description": "Mature, Middle pitch"},
+    "Pulcherrima": {"gender": "female", "description": "Forward, Middle pitch"},
+    "Achird": {"gender": "male", "description": "Friendly, Lower middle pitch"},
+    "Zubenelgenubi": {"gender": "male", "description": "Casual, Lower middle pitch"},
+    "Vindemiatrix": {"gender": "female", "description": "Gentle, Middle pitch"},
+    "Sadachbia": {"gender": "male", "description": "Lively, Lower pitch"},
+    "Sadaltager": {"gender": "male", "description": "Knowledgeable, Middle pitch"},
+    "Sulafat": {"gender": "female", "description": "Warm, Middle pitch"},
+}
+# The list of voice names, derived from the keys of the details dictionary.
+# This is used for the `enum_values` to maintain compatibility.
+GEMINI_TTS_VOICES = list(GEMINI_VOICE_DETAILS.keys())
+# Generate a formatted string of voice metadata to be appended to parameter descriptions.
+_voice_descriptions_list = [
+    f"- {name} ({details['gender']}): {details['description']}"
+    for name, details in GEMINI_VOICE_DETAILS.items()
 ]
+GEMINI_VOICE_METADATA_DESC = "\n\nDetailed Voice Options:\n" + "\n".join(_voice_descriptions_list)
 OPENAI_TTS_VOICES = [
     "alloy", "ash", "ballad", "coral", "echo", "fable", "onyx",
@@ -64,7 +102,7 @@ class AudioClientFactory(metaclass=SingletonMeta):
             ParameterDefinition(
                 name="voice",
                 param_type=ParameterType.ENUM,
-                description="The voice to assign to this speaker.",
+                description="The voice to assign to this speaker." + GEMINI_VOICE_METADATA_DESC,
                 enum_values=GEMINI_TTS_VOICES,
                 required=True
             )
@@ -84,7 +122,7 @@ class AudioClientFactory(metaclass=SingletonMeta):
                 param_type=ParameterType.ENUM,
                 default_value="Kore",
                 enum_values=GEMINI_TTS_VOICES,
-                description="The voice to use for single-speaker generation."
+                description="The voice to use for single-speaker generation." + GEMINI_VOICE_METADATA_DESC
             ),
             ParameterDefinition(
                 name="style_instructions",
@@ -102,7 +140,7 @@ class AudioClientFactory(metaclass=SingletonMeta):
         gemini_tts_model = AudioModel(
             name="gemini-2.5-flash-tts",
             value="gemini-2.5-flash-preview-tts",
-            provider=MultimediaProvider.GOOGLE,
+            provider=MultimediaProvider.GEMINI,
             client_class=GeminiAudioClient,
             parameter_schema=gemini_tts_schema
         )

autobyteus/multimedia/audio/audio_model.py CHANGED Viewed

@@ -79,7 +79,8 @@ class AudioModel(metaclass=AudioModelMeta):
         """Returns the unique identifier for the model."""
         if self.runtime == MultimediaRuntime.AUTOBYTEUS and self.host_url:
             try:
-                host = urlparse(self.host_url).hostname
+                parsed = urlparse(self.host_url)
+                host = parsed.netloc or parsed.hostname or self.host_url
                 return f"{self.name}@{host}"
             except Exception:
                 return f"{self.name}@{self.host_url}" # Fallback

autobyteus/multimedia/image/api/autobyteus_image_client.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import logging
+import uuid
 from typing import Optional, List, Dict, Any, TYPE_CHECKING
 from autobyteus.clients import AutobyteusClient
 from autobyteus.multimedia.image.base_image_client import BaseImageClient
@@ -13,6 +14,7 @@ logger = logging.getLogger(__name__)
 class AutobyteusImageClient(BaseImageClient):
     """
     An image client that connects to an Autobyteus LLM server instance for image tasks.
+    Maintains a persistent session ID for stateful interactions (e.g. conversational editing).
     """
     def __init__(self, model: "ImageModel", config: "MultimediaConfig"):
@@ -21,7 +23,9 @@ class AutobyteusImageClient(BaseImageClient):
             raise ValueError("AutobyteusImageClient requires a host_url in its ImageModel.")
         self.autobyteus_client = AutobyteusClient(server_url=model.host_url)
-        logger.info(f"AutobyteusImageClient initialized for model '{self.model.name}' on host '{model.host_url}'.")
+        self.session_id = str(uuid.uuid4())
+        logger.info(f"AutobyteusImageClient initialized for model '{self.model.name}' "
+                    f"on host '{model.host_url}' with session_id '{self.session_id}'.")
     async def generate_image(
         self,
@@ -72,7 +76,7 @@ class AutobyteusImageClient(BaseImageClient):
     ) -> ImageGenerationResponse:
         """Internal helper to call the remote server."""
         try:
-            logger.info(f"Sending image generation request for model '{self.model.name}' to {self.model.host_url}")
+            logger.info(f"Sending image generation request for model '{self.model.name}' to {self.model.host_url} (Session: {self.session_id})")
             # The model name for the remote server is the `value`, not the unique `model_identifier`
             model_name_for_server = self.model.name
@@ -84,7 +88,8 @@ class AutobyteusImageClient(BaseImageClient):
                 prompt=prompt,
                 input_image_urls=input_image_urls,
                 mask_url=mask_url,
-                generation_config=generation_config
+                generation_config=generation_config,
+                session_id=self.session_id
             )
             image_urls = response_data.get("image_urls", [])
@@ -98,7 +103,16 @@ class AutobyteusImageClient(BaseImageClient):
             raise
     async def cleanup(self):
-        """Closes the underlying AutobyteusClient."""
+        """
+        Notifies the server to cleanup the session, then closes the underlying HTTP client.
+        """
         if self.autobyteus_client:
-            await self.autobyteus_client.close()
+            try:
+                logger.info(f"Notifying server to cleanup image session '{self.session_id}'...")
+                await self.autobyteus_client.cleanup_image_session(self.session_id)
+            except Exception as e:
+                logger.error(f"Failed to cleanup remote image session '{self.session_id}': {e}")
+            finally:
+                await self.autobyteus_client.close()
         logger.debug("AutobyteusImageClient cleaned up.")

autobyteus/multimedia/image/api/gemini_image_client.py CHANGED Viewed

@@ -1,14 +1,13 @@
 import logging
 import base64
-import os
 from typing import Optional, List, Dict, Any, TYPE_CHECKING
-from google import genai
-from PIL import Image
-import requests
+from google.genai import types as genai_types
 from autobyteus.multimedia.image.base_image_client import BaseImageClient
 from autobyteus.multimedia.utils.response_types import ImageGenerationResponse
 from autobyteus.multimedia.utils.api_utils import load_image_from_url
+from autobyteus.utils.gemini_helper import initialize_gemini_client_with_runtime
+from autobyteus.utils.gemini_model_mapping import resolve_model_for_runtime
 if TYPE_CHECKING:
     from autobyteus.multimedia.image.image_model import ImageModel
@@ -21,17 +20,15 @@ class GeminiImageClient(BaseImageClient):
     An image client that uses Google's Gemini models for image generation tasks.
     **Setup Requirements:**
-    1.  **Authentication:** Set the `GEMINI_API_KEY` environment variable with your API key.
+    1.  **AI Studio Mode:** Set `GEMINI_API_KEY`.
+    2.  **Vertex AI Mode:** Set `VERTEX_AI_PROJECT` and `VERTEX_AI_LOCATION`.
     """
     def __init__(self, model: "ImageModel", config: "MultimediaConfig"):
         super().__init__(model, config)
-        api_key = os.getenv("GEMINI_API_KEY")
-        if not api_key:
-            raise ValueError("Please set the GEMINI_API_KEY environment variable.")
         try:
-            self.client = genai.Client()
+            self.client, self.runtime_info = initialize_gemini_client_with_runtime()
             self.async_client = self.client.aio
             logger.info(f"GeminiImageClient initialized for model '{self.model.name}'.")
         except Exception as e:
@@ -60,16 +57,40 @@ class GeminiImageClient(BaseImageClient):
                     except Exception as e:
                         logger.error(f"Skipping image at '{url}' due to loading error: {e}")
-            # Note: The google-genai library uses the synchronous client for the `.generate_content` method on a model
-            # even in an async context, as there isn't a direct async equivalent exposed for this specific call on the model object.
-            # We use the top-level async client for other potential future calls if the library API changes.
-            model_instance = self.client.get_generative_model(model_name=f"models/{self.model.value}")
-            response = await model_instance.generate_content_async(contents=content)
+            config_dict: Dict[str, Any] = {}
+            if self.config and self.config.params:
+                config_dict.update(self.config.params)
+            if generation_config:
+                config_dict.update(generation_config)
+            if "response_modalities" not in config_dict:
+                if getattr(self, "runtime_info", None) and self.runtime_info.runtime == "vertex":
+                    config_dict["response_modalities"] = ["TEXT", "IMAGE"]
+                else:
+                    config_dict["response_modalities"] = ["IMAGE"]
+            config = genai_types.GenerateContentConfig(**config_dict)
+            # FIX: Removed 'models/' prefix from model_name to support Vertex AI
+            runtime_adjusted_model = resolve_model_for_runtime(
+                self.model.value,
+                modality="image",
+                runtime=getattr(self, "runtime_info", None) and self.runtime_info.runtime,
+            )
+            if runtime_adjusted_model != self.model.value:
+                logger.info(
+                    "Using runtime-adjusted Gemini image model '%s' (requested '%s').",
+                    runtime_adjusted_model,
+                    self.model.value,
+                )
+            response = await self.async_client.models.generate_content(
+                model=runtime_adjusted_model,
+                contents=content,
+                config=config,
+            )
             image_urls = []
-            for part in response.parts:
-                if part.inline_data and "image" in part.inline_data.mime_type:
+            for part in response.parts or []:
+                if part.inline_data and part.inline_data.mime_type and "image" in part.inline_data.mime_type:
                     image_bytes = part.inline_data.data
                     base64_image = base64.b64encode(image_bytes).decode("utf-8")
                     data_uri = f"data:{part.inline_data.mime_type};base64,{base64_image}"
@@ -77,7 +98,7 @@ class GeminiImageClient(BaseImageClient):
             if not image_urls:
                 # Check for a safety-related refusal to generate content
-                if response.prompt_feedback.block_reason:
+                if response.prompt_feedback and response.prompt_feedback.block_reason:
                     reason = response.prompt_feedback.block_reason.name
                     logger.error(f"Image generation blocked due to safety settings. Reason: {reason}")
                     raise ValueError(f"Image generation failed due to safety settings: {reason}")

autobyteus/multimedia/image/api/openai_image_client.py CHANGED Viewed

@@ -1,9 +1,14 @@
 import logging
 import os
+import tempfile
+from pathlib import Path
 from typing import Optional, List, Dict, Any, TYPE_CHECKING
 from openai import OpenAI
 from autobyteus.multimedia.image.base_image_client import BaseImageClient
 from autobyteus.multimedia.utils.response_types import ImageGenerationResponse
+from autobyteus.utils.download_utils import download_file_from_url
 if TYPE_CHECKING:
     from autobyteus.multimedia.image.image_model import ImageModel
@@ -11,9 +16,19 @@ if TYPE_CHECKING:
 logger = logging.getLogger(__name__)
+def _mime_type_from_format(output_format: str) -> str:
+    fmt = (output_format or "png").lower()
+    if fmt in {"jpg", "jpeg"}:
+        return "image/jpeg"
+    if fmt == "webp":
+        return "image/webp"
+    return "image/png"
 class OpenAIImageClient(BaseImageClient):
     """
-    An image client that uses OpenAI's DALL-E models.
+    An image client that uses OpenAI's gpt-image series via the images API.
     """
     def __init__(self, model: "ImageModel", config: "MultimediaConfig"):
@@ -34,49 +49,68 @@ class OpenAIImageClient(BaseImageClient):
         **kwargs
     ) -> ImageGenerationResponse:
         """
-        Generates an image using an OpenAI DALL-E model via the v1/images/generations endpoint.
-        Note: This endpoint does not support image inputs, even for multimodal models like gpt-image-1.
+        Generates an image using OpenAI's images generation endpoint.
+        Note: This endpoint does not support image inputs.
         """
         if input_image_urls:
             logger.warning(
-                f"The OpenAI `images.generate` API used by this client does not support input images. "
-                f"The images provided for model '{self.model.value}' will be ignored. "
-                f"To use image inputs, a client based on the Chat Completions API is required."
+                "The OpenAI `images.generate` API used by this client does not support input images. "
+                "The images provided for model '%s' will be ignored. "
+                "To use image inputs, a client based on the Chat Completions API is required.",
+                self.model.value,
             )
         try:
             image_model = self.model.value
-            logger.info(f"Generating image with OpenAI model '{image_model}' and prompt: '{prompt[:50]}...'")
+            logger.info("Generating image with OpenAI model '%s' and prompt: '%s...'", image_model, prompt[:50])
             # Combine default config with any overrides
             final_config = self.config.to_dict().copy()
             if generation_config:
                 final_config.update(generation_config)
-            response = self.client.images.generate(
-                model=image_model,
-                prompt=prompt,
-                n=final_config.get("n", 1),
-                size=final_config.get("size", "1024x1024"),
-                quality=final_config.get("quality", "standard"),
-                style=final_config.get("style", "vivid"),
-                response_format="url"
+            # Always request a single image for simplicity
+            final_config["n"] = 1
+            request_kwargs = {
+                "model": image_model,
+                "prompt": prompt,
+                "n": 1,
+                "size": final_config.get("size", "1024x1024"),
+                "quality": final_config.get("quality", "standard"),
+            }
+            if "output_format" in final_config:
+                request_kwargs["output_format"] = final_config["output_format"]
+            if "output_compression" in final_config:
+                request_kwargs["output_compression"] = final_config["output_compression"]
+            response = self.client.images.generate(**request_kwargs)
+            output_format = final_config.get("output_format", "png")
+            mime_type = _mime_type_from_format(output_format)
+            image_urls_list: List[str] = []
+            for img in response.data:
+                if getattr(img, "url", None):
+                    image_urls_list.append(img.url)
+                elif getattr(img, "b64_json", None):
+                    image_urls_list.append(f"data:{mime_type};base64,{img.b64_json}")
+            revised_prompt: Optional[str] = (
+                response.data[0].revised_prompt
+                if response.data and hasattr(response.data[0], "revised_prompt")
+                else None
             )
-            image_urls_list: List[str] = [img.url for img in response.data if img.url]
-            revised_prompt: Optional[str] = response.data[0].revised_prompt if response.data and hasattr(response.data[0], 'revised_prompt') else None
             if not image_urls_list:
-                raise ValueError("OpenAI API did not return any image URLs.")
+                raise ValueError("OpenAI API did not return any image data.")
-            logger.info(f"Successfully generated {len(image_urls_list)} image(s).")
+            logger.info("Successfully generated %s image(s).", len(image_urls_list))
             return ImageGenerationResponse(
                 image_urls=image_urls_list,
                 revised_prompt=revised_prompt
             )
         except Exception as e:
-            logger.error(f"Error during OpenAI image generation: {str(e)}")
+            logger.error("Error during OpenAI image generation: %s", str(e))
             raise ValueError(f"OpenAI image generation failed: {str(e)}")
     async def edit_image(
@@ -95,49 +129,97 @@ class OpenAIImageClient(BaseImageClient):
         source_image_url = input_image_urls[0]
         if len(input_image_urls) > 1:
-            logger.warning(f"OpenAI edit endpoint only supports one input image. Using '{source_image_url}' and ignoring the rest.")
+            logger.warning(
+                "OpenAI edit endpoint only supports one input image. Using '%s' and ignoring the rest.",
+                source_image_url,
+            )
+        temp_image_path: Optional[Path] = None
+        temp_mask_path: Optional[Path] = None
         try:
-            logger.info(f"Editing image '{source_image_url}' with prompt: '{prompt[:50]}...'")
+            logger.info("Editing image '%s' with prompt: '%s...'", source_image_url, prompt[:50])
             # Combine default config with any overrides
             final_config = self.config.to_dict().copy()
             if generation_config:
                 final_config.update(generation_config)
-            with open(source_image_url, "rb") as image_file:
-                mask_file = open(mask_url, "rb") if mask_url else None
+            # Always request a single edited image
+            final_config["n"] = 1
+            source_path = Path(source_image_url)
+            if not source_path.exists():
+                temp_image_file = tempfile.NamedTemporaryFile(delete=False, suffix=".png")
+                temp_image_file.close()
+                temp_image_path = Path(temp_image_file.name)
+                await download_file_from_url(source_image_url, temp_image_path)
+                source_path = temp_image_path
+            if mask_url:
+                mask_path = Path(mask_url)
+                if not mask_path.exists():
+                    temp_mask_file = tempfile.NamedTemporaryFile(delete=False, suffix=".png")
+                    temp_mask_file.close()
+                    temp_mask_path = Path(temp_mask_file.name)
+                    await download_file_from_url(mask_url, temp_mask_path)
+                    mask_path = temp_mask_path
+            else:
+                mask_path = None
+            with open(source_path, "rb") as image_file:
+                mask_file = open(mask_path, "rb") if mask_path else None
                 try:
-                    response = self.client.images.edit(
-                        image=image_file,
-                        mask=mask_file,
-                        prompt=prompt,
-                        model=self.model.value,
-                        n=final_config.get("n", 1),
-                        size=final_config.get("size", "1024x1024"),
-                        response_format="url"
-                    )
+                    request_kwargs = {
+                        "image": image_file,
+                        "prompt": prompt,
+                        "model": self.model.value,
+                        "n": final_config.get("n", 1),
+                        "size": final_config.get("size", "1024x1024"),
+                    }
+                    if mask_file:
+                        request_kwargs["mask"] = mask_file
+                    if "output_format" in final_config:
+                        request_kwargs["output_format"] = final_config["output_format"]
+                    if "output_compression" in final_config:
+                        request_kwargs["output_compression"] = final_config["output_compression"]
+                    response = self.client.images.edit(**request_kwargs)
                 finally:
                     if mask_file:
                         mask_file.close()
-            image_urls_list: List[str] = [img.url for img in response.data if img.url]
+            output_format = final_config.get("output_format", "png")
+            mime_type = _mime_type_from_format(output_format)
+            image_urls_list: List[str] = []
+            for img in response.data:
+                if getattr(img, "url", None):
+                    image_urls_list.append(img.url)
+                elif getattr(img, "b64_json", None):
+                    image_urls_list.append(f"data:{mime_type};base64,{img.b64_json}")
             if not image_urls_list:
-                raise ValueError("OpenAI API did not return any edited image URLs.")
+                raise ValueError("OpenAI API did not return any edited image data.")
-            logger.info(f"Successfully edited image, generated {len(image_urls_list)} version(s).")
+            logger.info("Successfully edited image, generated %s version(s).", len(image_urls_list))
             return ImageGenerationResponse(image_urls=image_urls_list)
         except FileNotFoundError as e:
-            logger.error(f"Image file not found for editing: {e.filename}")
+            logger.error("Image file not found for editing: %s", e.filename)
             raise
         except Exception as e:
-            logger.error(f"Error during OpenAI image editing: {str(e)}")
-            # The API might return a 400 Bad Request if the model doesn't support edits
+            logger.error("Error during OpenAI image editing: %s", str(e))
             if "does not support image editing" in str(e):
                 raise ValueError(f"The model '{self.model.value}' does not support the image editing endpoint.")
             raise ValueError(f"OpenAI image editing failed: {str(e)}")
+        finally:
+            if temp_image_path and temp_image_path.exists():
+                try:
+                    temp_image_path.unlink()
+                except OSError:
+                    logger.warning("Failed to clean up temp image file: %s", temp_image_path)
+            if temp_mask_path and temp_mask_path.exists():
+                try:
+                    temp_mask_path.unlink()
+                except OSError:
+                    logger.warning("Failed to clean up temp mask file: %s", temp_mask_path)
     async def cleanup(self):
         # The OpenAI client does not require explicit cleanup of a session.

autobyteus/multimedia/image/autobyteus_image_provider.py CHANGED Viewed

@@ -86,7 +86,8 @@ class AutobyteusImageModelProvider:
                             client_class=AutobyteusImageClient,
                             runtime=MultimediaRuntime.AUTOBYTEUS,
                             host_url=host_url,
-                            parameter_schema=model_info.get("parameter_schema")
+                            parameter_schema=model_info.get("parameter_schema"),
+                            description=model_info.get("description")
                         )
                         ImageClientFactory.register_model(image_model)

autobyteus/multimedia/image/image_client_factory.py CHANGED Viewed

@@ -40,43 +40,75 @@ class ImageClientFactory(metaclass=SingletonMeta):
         """Initializes the registry with built-in image models and discovers remote ones."""
         # OpenAI Models
-        gpt_image_1_schema = ParameterSchema(parameters=[
+        gpt_image_15_schema = ParameterSchema(parameters=[
             ParameterDefinition(name="n", param_type=ParameterType.INTEGER, default_value=1, enum_values=[1], description="The number of images to generate."),
             ParameterDefinition(name="size", param_type=ParameterType.ENUM, default_value="1024x1024", enum_values=["1024x1024", "1792x1024", "1024x1792"], description="The size of the generated images."),
-            ParameterDefinition(name="quality", param_type=ParameterType.ENUM, default_value="hd", enum_values=["standard", "hd"], description="The quality of the image that will be generated."),
-            ParameterDefinition(name="style", param_type=ParameterType.ENUM, default_value="vivid", enum_values=["vivid", "natural"], description="The style of the generated images.")
+            ParameterDefinition(name="quality", param_type=ParameterType.ENUM, default_value="auto", enum_values=["auto", "low", "medium", "high"], description="The quality of the image that will be generated.")
         ])
-        gpt_image_1_model = ImageModel(
-            name="gpt-image-1",
-            value="gpt-image-1",
+        gemini_image_schema = ParameterSchema(parameters=[
+            ParameterDefinition(name="n", param_type=ParameterType.INTEGER, default_value=1, enum_values=[1], description="The number of images to generate."),
+            ParameterDefinition(name="size", param_type=ParameterType.ENUM, default_value="1024x1024", enum_values=["1024x1024", "1792x1024", "1024x1792"], description="The size of the generated images."),
+            ParameterDefinition(name="quality", param_type=ParameterType.ENUM, default_value="auto", enum_values=["auto", "low", "medium", "high"], description="The quality of the image that will be generated.")
+        ])
+        gpt_image_15_model = ImageModel(
+            name="gpt-image-1.5",
+            value="gpt-image-1.5",
             provider=MultimediaProvider.OPENAI,
             client_class=OpenAIImageClient,
-            parameter_schema=gpt_image_1_schema
+            parameter_schema=gpt_image_15_schema,
+            description=(
+                "OpenAI's latest **stateless (single-turn)** image model with faster renders, improved text rendering, "
+                "and higher fidelity edits. Same API surface as gpt-image-1."
+            )
         )
         # Google Imagen Models (via Gemini API)
         imagen_model = ImageModel(
             name="imagen-4",
             value="imagen-4.0-generate-001",
-            provider=MultimediaProvider.GOOGLE,
+            provider=MultimediaProvider.GEMINI,
             client_class=GeminiImageClient,
-            parameter_schema=None # The genai library doesn't expose these as simple params
+            parameter_schema=None, # The genai library doesn't expose these as simple params
+            description=(
+                "A high-fidelity **stateless (single-turn)** model. "
+                "Does **NOT** support input images (text-to-image only). "
+                "Any provided input images will be ignored."
+            )
         )
-        # Google Gemini Flash Image Model (aka "Nano Banana")
+        # Google Gemini 2.5 Flash Image (legacy, still widely available)
         gemini_flash_image_model = ImageModel(
-            name="gemini-2.5-flash-image-preview",
-            value="gemini-2.5-flash-image-preview",
-            provider=MultimediaProvider.GOOGLE,
+            name="gemini-2.5-flash-image",
+            value="gemini-2.5-flash-image",
+            provider=MultimediaProvider.GEMINI,
+            client_class=GeminiImageClient,
+            parameter_schema=None,  # Parameters handled by genai library
+            description=(
+                "Fast **conversational (multi-turn)** multimodal image model. "
+                "Supports context retention and input images for edits/variations."
+            )
+        )
+        # Google Gemini 3 Pro Image (aka "Nano Banana Pro")
+        gemini_pro_image_model = ImageModel(
+            name="gemini-3-pro-image-preview",
+            value="gemini-3-pro-image-preview",
+            provider=MultimediaProvider.GEMINI,
             client_class=GeminiImageClient,
-            parameter_schema=None # Parameters are not exposed for this model via the genai library.
+            parameter_schema=None,  # genai library handles options internally
+            description=(
+                "High-quality **conversational (multi-turn)** image model for complex edits and 4K renders. "
+                "Supports up to 14 reference images, advanced text rendering, and thinking mode."
+            )
         )
         models_to_register = [
-            gpt_image_1_model,
+            gpt_image_15_model,
             imagen_model,
             gemini_flash_image_model,
+            gemini_pro_image_model,
         ]
         for model in models_to_register:

autobyteus/multimedia/image/image_model.py CHANGED Viewed

@@ -50,7 +50,8 @@ class ImageModel(metaclass=ImageModelMeta):
         client_class: Type["BaseImageClient"],
         parameter_schema: Optional[Union[Dict[str, Any], ParameterSchema]] = None,
         runtime: MultimediaRuntime = MultimediaRuntime.API,
-        host_url: Optional[str] = None
+        host_url: Optional[str] = None,
+        description: Optional[str] = None
     ):
         self.name = name
         self.value = value
@@ -58,6 +59,7 @@ class ImageModel(metaclass=ImageModelMeta):
         self.client_class = client_class
         self.runtime = runtime
         self.host_url = host_url
+        self.description = description
         if isinstance(parameter_schema, dict):
             self.parameter_schema = ParameterSchema.from_dict(parameter_schema)
@@ -79,7 +81,8 @@ class ImageModel(metaclass=ImageModelMeta):
         """Returns the unique identifier for the model."""
         if self.runtime == MultimediaRuntime.AUTOBYTEUS and self.host_url:
             try:
-                host = urlparse(self.host_url).hostname
+                parsed = urlparse(self.host_url)
+                host = parsed.netloc or parsed.hostname or self.host_url
                 return f"{self.name}@{host}"
             except Exception:
                 return f"{self.name}@{self.host_url}" # Fallback

autobyteus/multimedia/providers.py CHANGED Viewed

@@ -2,5 +2,6 @@ from enum import Enum
 class MultimediaProvider(Enum):
     OPENAI = "OPENAI"
-    GOOGLE = "GOOGLE"
-    ALIBABA_QWEN = "ALIBABA_QWEN"
+    GEMINI = "GEMINI"
+    QWEN = "QWEN"
+    AUTOBYTEUS = "AUTOBYTEUS"

autobyteus 1.2.1__py3-none-any.whl → 1.2.3__py3-none-any.whl

autobyteus 1.2.1__py3-none-any.whl → 1.2.3__py3-none-any.whl