symbolicai 0.21.0__py3-none-any.whl → 1.1.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- symai/__init__.py +269 -173
- symai/backend/base.py +123 -110
- symai/backend/engines/drawing/engine_bfl.py +45 -44
- symai/backend/engines/drawing/engine_gpt_image.py +112 -97
- symai/backend/engines/embedding/engine_llama_cpp.py +63 -52
- symai/backend/engines/embedding/engine_openai.py +25 -21
- symai/backend/engines/execute/engine_python.py +19 -18
- symai/backend/engines/files/engine_io.py +104 -95
- symai/backend/engines/imagecaptioning/engine_blip2.py +28 -24
- symai/backend/engines/imagecaptioning/engine_llavacpp_client.py +102 -79
- symai/backend/engines/index/engine_pinecone.py +124 -97
- symai/backend/engines/index/engine_qdrant.py +1011 -0
- symai/backend/engines/index/engine_vectordb.py +84 -56
- symai/backend/engines/lean/engine_lean4.py +96 -52
- symai/backend/engines/neurosymbolic/__init__.py +41 -13
- symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_chat.py +330 -248
- symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_reasoning.py +329 -264
- symai/backend/engines/neurosymbolic/engine_cerebras.py +328 -0
- symai/backend/engines/neurosymbolic/engine_deepseekX_reasoning.py +118 -88
- symai/backend/engines/neurosymbolic/engine_google_geminiX_reasoning.py +344 -299
- symai/backend/engines/neurosymbolic/engine_groq.py +173 -115
- symai/backend/engines/neurosymbolic/engine_huggingface.py +114 -84
- symai/backend/engines/neurosymbolic/engine_llama_cpp.py +144 -118
- symai/backend/engines/neurosymbolic/engine_openai_gptX_chat.py +415 -307
- symai/backend/engines/neurosymbolic/engine_openai_gptX_reasoning.py +394 -231
- symai/backend/engines/ocr/engine_apilayer.py +23 -27
- symai/backend/engines/output/engine_stdout.py +10 -13
- symai/backend/engines/{webscraping → scrape}/engine_requests.py +101 -54
- symai/backend/engines/search/engine_openai.py +100 -88
- symai/backend/engines/search/engine_parallel.py +665 -0
- symai/backend/engines/search/engine_perplexity.py +44 -45
- symai/backend/engines/search/engine_serpapi.py +37 -34
- symai/backend/engines/speech_to_text/engine_local_whisper.py +54 -51
- symai/backend/engines/symbolic/engine_wolframalpha.py +15 -9
- symai/backend/engines/text_to_speech/engine_openai.py +20 -26
- symai/backend/engines/text_vision/engine_clip.py +39 -37
- symai/backend/engines/userinput/engine_console.py +5 -6
- symai/backend/mixin/__init__.py +13 -0
- symai/backend/mixin/anthropic.py +48 -38
- symai/backend/mixin/deepseek.py +6 -5
- symai/backend/mixin/google.py +7 -4
- symai/backend/mixin/groq.py +2 -4
- symai/backend/mixin/openai.py +140 -110
- symai/backend/settings.py +87 -20
- symai/chat.py +216 -123
- symai/collect/__init__.py +7 -1
- symai/collect/dynamic.py +80 -70
- symai/collect/pipeline.py +67 -51
- symai/collect/stats.py +161 -109
- symai/components.py +707 -360
- symai/constraints.py +24 -12
- symai/core.py +1857 -1233
- symai/core_ext.py +83 -80
- symai/endpoints/api.py +166 -104
- symai/extended/.DS_Store +0 -0
- symai/extended/__init__.py +46 -12
- symai/extended/api_builder.py +29 -21
- symai/extended/arxiv_pdf_parser.py +23 -14
- symai/extended/bibtex_parser.py +9 -6
- symai/extended/conversation.py +156 -126
- symai/extended/document.py +50 -30
- symai/extended/file_merger.py +57 -14
- symai/extended/graph.py +51 -32
- symai/extended/html_style_template.py +18 -14
- symai/extended/interfaces/blip_2.py +2 -3
- symai/extended/interfaces/clip.py +4 -3
- symai/extended/interfaces/console.py +9 -1
- symai/extended/interfaces/dall_e.py +4 -2
- symai/extended/interfaces/file.py +2 -0
- symai/extended/interfaces/flux.py +4 -2
- symai/extended/interfaces/gpt_image.py +16 -7
- symai/extended/interfaces/input.py +2 -1
- symai/extended/interfaces/llava.py +1 -2
- symai/extended/interfaces/{naive_webscraping.py → naive_scrape.py} +4 -3
- symai/extended/interfaces/naive_vectordb.py +9 -10
- symai/extended/interfaces/ocr.py +5 -3
- symai/extended/interfaces/openai_search.py +2 -0
- symai/extended/interfaces/parallel.py +30 -0
- symai/extended/interfaces/perplexity.py +2 -0
- symai/extended/interfaces/pinecone.py +12 -9
- symai/extended/interfaces/python.py +2 -0
- symai/extended/interfaces/serpapi.py +3 -1
- symai/extended/interfaces/terminal.py +2 -4
- symai/extended/interfaces/tts.py +3 -2
- symai/extended/interfaces/whisper.py +3 -2
- symai/extended/interfaces/wolframalpha.py +2 -1
- symai/extended/metrics/__init__.py +11 -1
- symai/extended/metrics/similarity.py +14 -13
- symai/extended/os_command.py +39 -29
- symai/extended/packages/__init__.py +29 -3
- symai/extended/packages/symdev.py +51 -43
- symai/extended/packages/sympkg.py +41 -35
- symai/extended/packages/symrun.py +63 -50
- symai/extended/repo_cloner.py +14 -12
- symai/extended/seo_query_optimizer.py +15 -13
- symai/extended/solver.py +116 -91
- symai/extended/summarizer.py +12 -10
- symai/extended/taypan_interpreter.py +17 -18
- symai/extended/vectordb.py +122 -92
- symai/formatter/__init__.py +9 -1
- symai/formatter/formatter.py +51 -47
- symai/formatter/regex.py +70 -69
- symai/functional.py +325 -176
- symai/imports.py +190 -147
- symai/interfaces.py +57 -28
- symai/memory.py +45 -35
- symai/menu/screen.py +28 -19
- symai/misc/console.py +66 -56
- symai/misc/loader.py +8 -5
- symai/models/__init__.py +17 -1
- symai/models/base.py +395 -236
- symai/models/errors.py +1 -2
- symai/ops/__init__.py +32 -22
- symai/ops/measures.py +24 -25
- symai/ops/primitives.py +1149 -731
- symai/post_processors.py +58 -50
- symai/pre_processors.py +86 -82
- symai/processor.py +21 -13
- symai/prompts.py +764 -685
- symai/server/huggingface_server.py +135 -49
- symai/server/llama_cpp_server.py +21 -11
- symai/server/qdrant_server.py +206 -0
- symai/shell.py +100 -42
- symai/shellsv.py +700 -492
- symai/strategy.py +630 -346
- symai/symbol.py +368 -322
- symai/utils.py +100 -78
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/METADATA +22 -10
- symbolicai-1.1.0.dist-info/RECORD +168 -0
- symbolicai-0.21.0.dist-info/RECORD +0 -162
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/WHEEL +0 -0
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/entry_points.txt +0 -0
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/licenses/LICENSE +0 -0
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/top_level.txt +0 -0
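
The hunks below belong to symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_chat.py: the class shown is ClaudeXChatEngine, and the added/removed totals match that file's +330 -248 entry above. The old-side content of several removed lines was truncated by the diff renderer and is reproduced as-is. Two cross-cutting renames from this release recur throughout: the webscraping engine and its naive_webscraping interface become scrape and naive_scrape, and the CustomUserWarning helper from symai.utils is replaced by UserMessage. Judging purely from the call sites visible in the hunks, the new helper keeps the old calling convention; a hypothetical sketch (the actual implementation lives in symai/utils.py, which this diff does not show):

    # Hypothetical usage distilled from call sites in the diff below;
    # not the actual symai/utils.py implementation.
    from symai.utils import UserMessage  # replaces CustomUserWarning in 1.1.0

    UserMessage("No frames found for image!")                              # plain user-facing notice
    UserMessage("Method not implemented.", raise_with=NotImplementedError) # notice tied to an exception type

Whether raise_with raises on its own cannot be confirmed from this diff alone: some call sites follow it with an explicit raise, while others rely on it to terminate the branch.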
--- a/symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_chat.py
+++ b/symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_chat.py
@@ -2,20 +2,22 @@ import json
 import logging
 import re
 from copy import copy, deepcopy
-from typing import List, Optional
 
 import anthropic
 from anthropic._types import NOT_GIVEN
-from anthropic.types import (
-
-
-
-
+from anthropic.types import (
+    InputJSONDelta,
+    Message,
+    RawContentBlockDeltaEvent,
+    RawContentBlockStartEvent,
+    RawContentBlockStopEvent,
+    TextBlock,
+    TextDelta,
+    ToolUseBlock,
+)
 
 from ....components import SelfPrompt
-from ....
-from ....symbol import Symbol
-from ....utils import CustomUserWarning, encode_media_frames
+from ....utils import UserMessage, encode_media_frames
 from ...base import Engine
 from ...mixin.anthropic import AnthropicMixin
 from ...settings import SYMAI_CONFIG
@@ -26,6 +28,7 @@ logging.getLogger("urllib").setLevel(logging.ERROR)
 logging.getLogger("httpx").setLevel(logging.ERROR)
 logging.getLogger("httpcore").setLevel(logging.ERROR)
 
+
 class TokenizerWrapper:
     def __init__(self, compute_tokens_func):
         self.compute_tokens_func = compute_tokens_func
@@ -33,18 +36,19 @@ class TokenizerWrapper:
     def encode(self, text: str) -> int:
         return self.compute_tokens_func([{"role": "user", "content": text}])
 
+
 class ClaudeXChatEngine(Engine, AnthropicMixin):
-    def __init__(self, api_key:
+    def __init__(self, api_key: str | None = None, model: str | None = None):
         super().__init__()
         self.config = deepcopy(SYMAI_CONFIG)
         # In case we use EngineRepository.register to inject the api_key and model => dynamically change the engine at runtime
         if api_key is not None and model is not None:
-            self.config[
-            self.config[
-        if self.id() !=
-            return
-        anthropic.api_key = self.config[
-        self.model = self.config[
+            self.config["NEUROSYMBOLIC_ENGINE_API_KEY"] = api_key
+            self.config["NEUROSYMBOLIC_ENGINE_MODEL"] = model
+        if self.id() != "neurosymbolic":
+            return # do not initialize if not neurosymbolic; avoids conflict with llama.cpp check in EngineRepository.register_from_package
+        anthropic.api_key = self.config["NEUROSYMBOLIC_ENGINE_API_KEY"]
+        self.model = self.config["NEUROSYMBOLIC_ENGINE_MODEL"]
         self.name = self.__class__.__name__
         self.tokenizer = TokenizerWrapper(self.compute_required_tokens)
         self.max_context_tokens = self.api_max_context_tokens()
@@ -52,95 +56,110 @@ class ClaudeXChatEngine(Engine, AnthropicMixin):
         self.client = anthropic.Anthropic(api_key=anthropic.api_key)
 
     def id(self) -> str:
-        if
-
-
-
-
-
-
-
+        if (
+            self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
+            and self.config.get("NEUROSYMBOLIC_ENGINE_MODEL").startswith("claude")
+            and (
+                "3-7" not in self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
+                and "4-0" not in self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
+                and "4-1" not in self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
+                and "4-5" not in self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
+            )
+        ):
+            return "neurosymbolic"
+        return super().id() # default to unregistered
 
     def command(self, *args, **kwargs):
         super().command(*args, **kwargs)
-        if
-            anthropic.api_key = kwargs[
-        if
-            self.model = kwargs[
+        if "NEUROSYMBOLIC_ENGINE_API_KEY" in kwargs:
+            anthropic.api_key = kwargs["NEUROSYMBOLIC_ENGINE_API_KEY"]
+        if "NEUROSYMBOLIC_ENGINE_MODEL" in kwargs:
+            self.model = kwargs["NEUROSYMBOLIC_ENGINE_MODEL"]
 
     def compute_required_tokens(self, messages) -> int:
+        claude_messages, system_content = self._build_claude_messages(messages)
+
+        if not claude_messages:
+            return 0
+
+        return self._count_claude_tokens(claude_messages, system_content)
+
+    def _build_claude_messages(self, messages):
         claude_messages = []
         system_content = None
 
+        for role, content_str in self._message_parts(messages):
+            if role == "system":
+                system_content = content_str
+                continue
+
+            if role in ["user", "assistant"]:
+                message_content = self._build_message_content(content_str)
+                if message_content:
+                    claude_messages.append(self._create_claude_message(role, message_content))
+
+        return claude_messages, system_content
+
+    def _message_parts(self, messages):
         for msg in messages:
-            if
-
-
-            if isinstance(part, str):
-                role = 'user'
-                content_str = part
-            elif isinstance(part, dict):
-                role = part.get('role')
-                content_str = str(part.get('content', ''))
-            else:
-                CustomUserWarning(f"Unsupported message part type: {type(part)}", raise_with=ValueError)
-
-            if role == 'system':
-                system_content = content_str
-                continue
-
-            if role in ['user', 'assistant']:
-                message_content = []
-
-                image_content = self._handle_image_content(content_str)
-                message_content.extend(image_content)
-
-                text_content = self._remove_vision_pattern(content_str)
-                if text_content:
-                    message_content.append({
-                        "type": "text",
-                        "text": text_content
-                    })
-
-                if message_content:
-                    if len(message_content) == 1 and message_content[0].get('type') == 'text':
-                        claude_messages.append({
-                            'role': role,
-                            'content': message_content[0]['text']
-                        })
-                    else:
-                        claude_messages.append({
-                            'role': role,
-                            'content': message_content
-                        })
+            msg_parts = msg if isinstance(msg, list) else [msg]
+            for part in msg_parts:
+                yield self._extract_message_details(part)
 
-
-
+    def _extract_message_details(self, part):
+        if isinstance(part, str):
+            return "user", part
 
+        if isinstance(part, dict):
+            role = part.get("role")
+            content_str = str(part.get("content", ""))
+            return role, content_str
+
+        msg = f"Unsupported message part type: {type(part)}"
+        UserMessage(msg, raise_with=ValueError)
+        raise ValueError(msg)
+
+    def _build_message_content(self, content_str: str) -> list:
+        message_content = []
+
+        image_content = self._handle_image_content(content_str)
+        message_content.extend(image_content)
+
+        text_content = self._remove_vision_pattern(content_str)
+        if text_content:
+            message_content.append({"type": "text", "text": text_content})
+
+        return message_content
+
+    def _create_claude_message(self, role: str, message_content: list) -> dict:
+        if len(message_content) == 1 and message_content[0].get("type") == "text":
+            return {"role": role, "content": message_content[0]["text"]}
+
+        return {"role": role, "content": message_content}
+
+    def _count_claude_tokens(self, claude_messages: list, system_content: str | None) -> int:
         try:
-            count_params = {
-                'model': self.model,
-                'messages': claude_messages
-            }
+            count_params = {"model": self.model, "messages": claude_messages}
             if system_content:
-                count_params[
+                count_params["system"] = system_content
             count_response = self.client.messages.count_tokens(**count_params)
             return count_response.input_tokens
         except Exception as e:
-
-
+            UserMessage(f"Claude count_tokens failed: {e}")
+            UserMessage(f"Error counting tokens for Claude: {e!s}", raise_with=RuntimeError)
 
-    def compute_remaining_tokens(self,
-
+    def compute_remaining_tokens(self, _prompts: list) -> int:
+        UserMessage("Method not implemented.", raise_with=NotImplementedError)
 
     def _handle_image_content(self, content: str) -> list:
         """Handle image content by processing vision patterns and returning image file data."""
+
         def extract_pattern(text):
-            pattern = r
+            pattern = r"<<vision:(.*?):>>"
            return re.findall(pattern, text)
 
         image_files = []
-        if
+        if "<<vision:" in content:
            parts = extract_pattern(content)
            for p in parts:
                img_ = p.strip()
@@ -148,191 +167,229 @@ class ClaudeXChatEngine(Engine, AnthropicMixin):
                 max_used_frames = 10
                 buffer, ext = encode_media_frames(img_)
                 if len(buffer) > 1:
-                    step = len(buffer) // max_frames_spacing
+                    step = len(buffer) // max_frames_spacing # max frames spacing
                     frames = []
                     indices = list(range(0, len(buffer), step))[:max_used_frames]
                     for i in indices:
-                        frames.append(
+                        frames.append(
+                            {"data": buffer[i], "media_type": f"image/{ext}", "type": "base64"}
+                        )
                     image_files.extend(frames)
                 elif len(buffer) == 1:
-                    image_files.append(
+                    image_files.append(
+                        {"data": buffer[0], "media_type": f"image/{ext}", "type": "base64"}
+                    )
                 else:
-
+                    UserMessage("No frames found for image!")
         return image_files
 
     def _remove_vision_pattern(self, text: str) -> str:
         """Remove vision patterns from text."""
-        pattern = r
-        return re.sub(pattern,
+        pattern = r"<<vision:(.*?):>>"
+        return re.sub(pattern, "", text)
 
     def forward(self, argument):
         kwargs = argument.kwargs
         system, messages = argument.prop.prepared_input
         payload = self._prepare_request_payload(argument)
-        except_remedy = kwargs.get(
+        except_remedy = kwargs.get("except_remedy")
 
         try:
-            res = self.client.messages.create(
-                system=system,
-                messages=messages,
-                **payload
-            )
+            res = self.client.messages.create(system=system, messages=messages, **payload)
         except Exception as e:
-            if anthropic.api_key is None or anthropic.api_key ==
-                msg =
-
-                if
-
-
+            if anthropic.api_key is None or anthropic.api_key == "":
+                msg = "Anthropic API key is not set. Please set it in the config file or pass it as an argument to the command method."
+                UserMessage(msg)
+                if (
+                    self.config["NEUROSYMBOLIC_ENGINE_API_KEY"] is None
+                    or self.config["NEUROSYMBOLIC_ENGINE_API_KEY"] == ""
+                ):
+                    UserMessage(msg, raise_with=ValueError)
+                anthropic.api_key = self.config["NEUROSYMBOLIC_ENGINE_API_KEY"]
 
             callback = self.client.messages.create
-            kwargs[
+            kwargs["model"] = kwargs.get("model", self.model)
 
             if except_remedy is not None:
                 res = except_remedy(self, e, callback, argument)
             else:
-
+                UserMessage(f"Error during generation. Caused by: {e}", raise_with=ValueError)
 
-        if payload[
-            res =
-        metadata = {
+        if payload["stream"]:
+            res = list(res) # Unpack the iterator to a list
+        metadata = {"raw_output": res}
         response_data = self._collect_response(res)
 
-        if response_data.get(
-            metadata[
+        if response_data.get("function_call"):
+            metadata["function_call"] = response_data["function_call"]
 
-        text_output = response_data.get(
+        text_output = response_data.get("text", "")
         if argument.prop.response_format:
             # Anthropic returns JSON in markdown format
-            text_output = text_output.replace(
+            text_output = text_output.replace("```json", "").replace("```", "")
 
         return [text_output], metadata
 
     def _prepare_raw_input(self, argument):
         if not argument.prop.processed_input:
-
+            msg = "Need to provide a prompt instruction to the engine if `raw_input` is enabled!"
+            UserMessage(msg)
+            raise ValueError(msg)
         system = NOT_GIVEN
         prompt = copy(argument.prop.processed_input)
-        if
-            if
-                prompt = {
+        if not isinstance(prompt, list):
+            if not isinstance(prompt, dict):
+                prompt = {"role": "user", "content": str(prompt)}
            prompt = [prompt]
         if len(prompt) > 1:
             # assert there are not more than 1 system instruction
-            assert len([p for p in prompt if p[
+            assert len([p for p in prompt if p["role"] == "system"]) <= 1, (
+                "Only one system instruction is allowed!"
+            )
             for p in prompt:
-                if p[
-                    system = p[
+                if p["role"] == "system":
+                    system = p["content"]
                    prompt.remove(p)
                    break
         return system, prompt
 
     def prepare(self, argument):
-
+        # @NOTE: OpenAI compatibility at high level
         if argument.prop.raw_input:
             argument.prop.prepared_input = self._prepare_raw_input(argument)
             return
 
-
-
-
+        non_verbose_output = """<META_INSTRUCTION/>\nYou do not output anything else, like verbose preambles or post explanation, such as "Sure, let me...", "Hope that was helpful...", "Yes, I can help you with that...", etc. Consider well formatted output, e.g. for sentences use punctuation, spaces etc. or for code use indentation, etc. Never add meta instructions information to your output!\n\n"""
+        image_files = self._handle_image_content(str(argument.prop.processed_input))
+        has_image = len(image_files) > 0
+
+        system = self._build_system_prompt(argument, has_image, non_verbose_output)
+        user_text, user_prompt, image_blocks = self._build_user_prompt(argument, image_files)
+        system, user_prompt = self._apply_self_prompt_if_needed(
+            argument, system, user_text, image_blocks, user_prompt
+        )
 
+        argument.prop.prepared_input = (system, [user_prompt])
+
+    def _build_system_prompt(self, argument, has_image: bool, non_verbose_output: str) -> str:
+        system = self._build_system_prefix(argument, non_verbose_output)
+        system = self._append_context_sections(system, argument)
+        system = self._append_instruction_section(system, argument, has_image)
+        return self._append_template_suffix(system, argument)
+
+    def _build_system_prefix(self, argument, non_verbose_output: str) -> str:
+        system = ""
         if argument.prop.suppress_verbose_output:
-            system +=
-
+            system += non_verbose_output
+
+        system = f"{system}\n" if system and len(system) > 0 else ""
 
         if argument.prop.response_format:
-
-            assert
-
-
+            response_format = argument.prop.response_format
+            assert response_format.get("type") is not None, (
+                'Response format type is required! Expected format `{"type": str}`! The str value will be passed to the engine. Refer to the Anthropic documentation for more information: https://docs.anthropic.com/en/docs/test-and-evaluate/strengthen-guardrails/increase-consistency#example-standardizing-customer-feedback'
+            )
+            system += non_verbose_output
+            system += f"<RESPONSE_FORMAT/>\n{response_format['type']}\n\n"
+
+        return system
 
+    def _append_context_sections(self, system: str, argument) -> str:
         ref = argument.prop.instance
-
-
-
+        static_context, dynamic_context = ref.global_context
+
+        if len(static_context) > 0:
+            system += f"<STATIC_CONTEXT/>\n{static_context}\n\n"
 
-        if len(
-            system += f"<DYNAMIC_CONTEXT/>\n{
+        if len(dynamic_context) > 0:
+            system += f"<DYNAMIC_CONTEXT/>\n{dynamic_context}\n\n"
 
         payload = argument.prop.payload
         if argument.prop.payload:
-            system += f"<ADDITIONAL_CONTEXT/>\n{
+            system += f"<ADDITIONAL_CONTEXT/>\n{payload!s}\n\n"
 
-        examples:
+        examples: list[str] = argument.prop.examples
         if examples and len(examples) > 0:
-            system += f"<EXAMPLES/>\n{
+            system += f"<EXAMPLES/>\n{examples!s}\n\n"
 
-
+        return system
 
+    def _append_instruction_section(self, system: str, argument, has_image: bool) -> str:
         if argument.prop.prompt is not None and len(argument.prop.prompt) > 0:
-
-            if
-
-            system += f"<INSTRUCTION/>\n{
+            instruction_value = str(argument.prop.prompt)
+            if has_image:
+                instruction_value = self._remove_vision_pattern(instruction_value)
+            system += f"<INSTRUCTION/>\n{instruction_value}\n\n"
+
+        return system
+
+    def _append_template_suffix(self, system: str, argument) -> str:
+        if argument.prop.template_suffix:
+            system += f" You will only generate content for the placeholder `{argument.prop.template_suffix!s}` following the instructions and the provided context information.\n\n"
 
-
+        return system
+
+    def _build_user_prompt(self, argument, image_files):
+        suffix = str(argument.prop.processed_input)
         if len(image_files) > 0:
            suffix = self._remove_vision_pattern(suffix)
 
-
+        user_text = f"{suffix}"
+        if not user_text:
+            user_text = "N/A"
 
-
-
-
+        image_blocks = [{"type": "image", "source": image_file} for image_file in image_files]
+        user_prompt = self._wrap_user_prompt_content(user_text, image_blocks)
+        return user_text, user_prompt, image_blocks
 
-
-
+    def _wrap_user_prompt_content(self, user_text: str, image_blocks: list[dict]) -> dict:
+        if len(image_blocks) > 0:
+            return {"role": "user", "content": [*image_blocks, {"type": "text", "text": user_text}]}
 
-
-            images = [{ 'type': 'image', "source": im } for im in image_files]
-            user_prompt = { "role": "user", "content": [
-                *images,
-                { 'type': 'text', 'text': user }
-            ]}
-        else:
-            user_prompt = { "role": "user", "content": user }
-
-        # First check if the `Symbol` instance has the flag set, otherwise check if it was passed as an argument to a method
-        if argument.prop.instance._kwargs.get('self_prompt', False) or argument.prop.self_prompt:
-            self_prompter = SelfPrompt()
-
-            res = self_prompter({'user': user, 'system': system})
-            if res is None:
-                raise ValueError("Self-prompting failed!")
-
-            if len(image_files) > 0:
-                user_prompt = { "role": "user", "content": [
-                    *images,
-                    { 'type': 'text', 'text': res['user'] }
-                ]}
-            else:
-                user_prompt = { "role": "user", "content": res['user'] }
+        return {"role": "user", "content": user_text}
 
-
+    def _apply_self_prompt_if_needed(
+        self, argument, system: str, user_text: str, image_blocks: list[dict], user_prompt: dict
+    ):
+        if not (
+            argument.prop.instance._kwargs.get("self_prompt", False) or argument.prop.self_prompt
+        ):
+            return system, user_prompt
 
-
+        self_prompter = SelfPrompt()
+        res = self_prompter({"user": user_text, "system": system})
+        if res is None:
+            msg = "Self-prompting failed!"
+            UserMessage(msg)
+            raise ValueError(msg)
+
+        updated_user_prompt = self._wrap_user_prompt_content(res["user"], image_blocks)
+        return res["system"], updated_user_prompt
 
     def _prepare_request_payload(self, argument):
         kwargs = argument.kwargs
-        model = kwargs.get(
-        max_tokens = kwargs.get(
-        stop = kwargs.get(
-        temperature = kwargs.get(
-        top_p = kwargs.get(
-
-
-
-
-
-
-
+        model = kwargs.get("model", self.model)
+        max_tokens = kwargs.get("max_tokens", self.max_response_tokens)
+        stop = kwargs.get("stop", NOT_GIVEN)
+        temperature = kwargs.get("temperature", 1)
+        top_p = kwargs.get(
+            "top_p", NOT_GIVEN if temperature is not None else 1
+        ) # @NOTE:'You should either alter temperature or top_p, but not both.'
+        top_k = kwargs.get("top_k", NOT_GIVEN)
+        stream = kwargs.get(
+            "stream", True
+        ) # Do NOT remove this default value! Getting tons of API errors because they can't process requests >10m
+        tools = kwargs.get("tools", NOT_GIVEN)
+        tool_choice = kwargs.get("tool_choice", NOT_GIVEN)
+        metadata_anthropic = kwargs.get("metadata", NOT_GIVEN)
+
+        if stop != NOT_GIVEN and not isinstance(stop, list):
            stop = [stop]
 
-
+        # @NOTE: Anthropic fails if stop is not raw string, so cast it to r'…'
         # E.g. when we use defaults in core.py, i.e. stop=['\n']
         if stop != NOT_GIVEN:
-            stop = [r
+            stop = [r"{s}" for s in stop]
 
         return {
             "model": model,
@@ -344,74 +401,99 @@ class ClaudeXChatEngine(Engine, AnthropicMixin):
             "stream": stream,
             "metadata": metadata_anthropic,
             "tools": tools,
-            "tool_choice": tool_choice
+            "tool_choice": tool_choice,
         }
 
     def _collect_response(self, res):
         if isinstance(res, list):
-
-            tool_calls_raw = []
-            active_tool_calls = {}
-
-            for chunk in res:
-                if isinstance(chunk, RawContentBlockStartEvent):
-                    if isinstance(chunk.content_block, ToolUseBlock):
-                        active_tool_calls[chunk.index] = {
-                            'id': chunk.content_block.id,
-                            'name': chunk.content_block.name,
-                            'input_json_str': ""
-                        }
-                elif isinstance(chunk, RawContentBlockDeltaEvent):
-                    if isinstance(chunk.delta, TextDelta):
-                        text_content += chunk.delta.text
-                    elif isinstance(chunk.delta, InputJSONDelta):
-                        if chunk.index in active_tool_calls:
-                            active_tool_calls[chunk.index]['input_json_str'] += chunk.delta.partial_json
-                elif isinstance(chunk, RawContentBlockStopEvent):
-                    if chunk.index in active_tool_calls:
-                        tool_call_info = active_tool_calls.pop(chunk.index)
-                        try:
-                            tool_call_info['input'] = json.loads(tool_call_info['input_json_str'])
-                        except json.JSONDecodeError as e:
-                            logging.error(f"Failed to parse JSON for tool call {tool_call_info['name']}: {e}. Raw JSON: '{tool_call_info['input_json_str']}'")
-                            tool_call_info['input'] = {}
-                        tool_calls_raw.append(tool_call_info)
-
-            function_call_data = None
-            if tool_calls_raw:
-                if len(tool_calls_raw) > 1:
-                    CustomUserWarning("Multiple tool calls detected in the stream but only the first one will be processed.")
-                function_call_data = {
-                    'name': tool_calls_raw[0]['name'],
-                    'arguments': tool_calls_raw[0]['input']
-                }
-
-            return {
-                "text": text_content,
-                "function_call": function_call_data
-            }
+            return self._collect_streaming_response(res)
 
-        # Non-streamed response (res is a Message object)
         if isinstance(res, Message):
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+            return self._collect_message_response(res)
+
+        UserMessage(
+            f"Unexpected response type from Anthropic API: {type(res)}", raise_with=ValueError
+        )
+        return {}
+
+    def _collect_streaming_response(self, res):
+        text_parts = []
+        tool_calls_raw = []
+        active_tool_calls = {}
+
+        for chunk in res:
+            if isinstance(chunk, RawContentBlockStartEvent):
+                self._start_tool_call(chunk, active_tool_calls)
+            elif isinstance(chunk, RawContentBlockDeltaEvent):
+                self._update_stream_chunk(chunk, text_parts, active_tool_calls)
+            elif isinstance(chunk, RawContentBlockStopEvent):
+                tool_call = self._finish_tool_call(chunk, active_tool_calls)
+                if tool_call is not None:
+                    tool_calls_raw.append(tool_call)
+
+        text_content = "".join(text_parts)
+        function_call_data = self._build_function_call_data(tool_calls_raw)
+
+        return {"text": text_content, "function_call": function_call_data}
+
+    def _start_tool_call(self, chunk, active_tool_calls: dict):
+        if isinstance(chunk.content_block, ToolUseBlock):
+            active_tool_calls[chunk.index] = {
+                "id": chunk.content_block.id,
+                "name": chunk.content_block.name,
+                "input_json_str": "",
            }
 
-
+    def _update_stream_chunk(self, chunk, text_parts: list, active_tool_calls: dict):
+        if isinstance(chunk.delta, TextDelta):
+            text_parts.append(chunk.delta.text)
+        elif isinstance(chunk.delta, InputJSONDelta) and chunk.index in active_tool_calls:
+            active_tool_calls[chunk.index]["input_json_str"] += chunk.delta.partial_json
+
+    def _finish_tool_call(self, chunk, active_tool_calls: dict):
+        if chunk.index not in active_tool_calls:
+            return None
+
+        tool_call_info = active_tool_calls.pop(chunk.index)
+        try:
+            tool_call_info["input"] = json.loads(tool_call_info["input_json_str"])
+        except json.JSONDecodeError as e:
+            UserMessage(
+                f"Failed to parse JSON for tool call {tool_call_info['name']}: {e}. Raw JSON: '{tool_call_info['input_json_str']}'"
+            )
+            tool_call_info["input"] = {}
+        return tool_call_info
+
+    def _build_function_call_data(self, tool_calls_raw: list | None) -> dict | None:
+        if not tool_calls_raw:
+            return None
+
+        if len(tool_calls_raw) > 1:
+            UserMessage(
+                "Multiple tool calls detected in the stream but only the first one will be processed."
+            )
+
+        tool_call = tool_calls_raw[0]
+        return {"name": tool_call["name"], "arguments": tool_call["input"]}
+
+    def _collect_message_response(self, res: Message):
+        text_parts = []
+        function_call_data = None
+        hit_tool_use = False
+
+        for content_block in res.content:
+            if isinstance(content_block, TextBlock):
+                text_parts.append(content_block.text)
+            elif isinstance(content_block, ToolUseBlock):
+                if hit_tool_use:
+                    UserMessage(
+                        "Multiple tool use blocks detected in the response but only the first one will be processed."
+                    )
+                else:
+                    function_call_data = {
+                        "name": content_block.name,
+                        "arguments": content_block.input,
+                    }
+                    hit_tool_use = True
+
+        return {"text": "".join(text_parts), "function_call": function_call_data}
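
The largest share of this file's diff is the decomposition of the monolithic _collect_response into focused helpers (_collect_streaming_response, _start_tool_call, _update_stream_chunk, _finish_tool_call, _build_function_call_data, _collect_message_response). As a rough standalone sketch of what the new streaming path computes, using the real anthropic.types event classes the file imports but with the engine plumbing stripped away (an illustration, not the package's code):

    import json

    from anthropic.types import (
        InputJSONDelta,
        RawContentBlockDeltaEvent,
        RawContentBlockStartEvent,
        RawContentBlockStopEvent,
        TextDelta,
        ToolUseBlock,
    )


    def collect_stream(chunks) -> dict:
        """Fold raw Anthropic stream events into final text plus the first tool call."""
        text_parts, tool_calls, active = [], [], {}
        for chunk in chunks:
            if isinstance(chunk, RawContentBlockStartEvent):
                # A tool-use block opens: track it by its stream index.
                if isinstance(chunk.content_block, ToolUseBlock):
                    active[chunk.index] = {"name": chunk.content_block.name, "json": ""}
            elif isinstance(chunk, RawContentBlockDeltaEvent):
                if isinstance(chunk.delta, TextDelta):
                    text_parts.append(chunk.delta.text)  # buffer; join once at the end
                elif isinstance(chunk.delta, InputJSONDelta) and chunk.index in active:
                    active[chunk.index]["json"] += chunk.delta.partial_json
            elif isinstance(chunk, RawContentBlockStopEvent) and chunk.index in active:
                call = active.pop(chunk.index)
                try:
                    call["input"] = json.loads(call["json"])
                except json.JSONDecodeError:
                    call["input"] = {}  # the engine warns and degrades the same way
                tool_calls.append(call)
        first = tool_calls[0] if tool_calls else None  # extra tool calls are warned about and dropped
        return {
            "text": "".join(text_parts),
            "function_call": {"name": first["name"], "arguments": first["input"]} if first else None,
        }

One design change visible in the hunks: the 0.21.0 code grew the output with text_content += chunk.delta.text inside the loop, while 1.1.0 appends deltas to a list and joins once, avoiding repeated string copies on long streams.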