symbolicai 0.21.0__py3-none-any.whl → 1.1.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- symai/__init__.py +269 -173
- symai/backend/base.py +123 -110
- symai/backend/engines/drawing/engine_bfl.py +45 -44
- symai/backend/engines/drawing/engine_gpt_image.py +112 -97
- symai/backend/engines/embedding/engine_llama_cpp.py +63 -52
- symai/backend/engines/embedding/engine_openai.py +25 -21
- symai/backend/engines/execute/engine_python.py +19 -18
- symai/backend/engines/files/engine_io.py +104 -95
- symai/backend/engines/imagecaptioning/engine_blip2.py +28 -24
- symai/backend/engines/imagecaptioning/engine_llavacpp_client.py +102 -79
- symai/backend/engines/index/engine_pinecone.py +124 -97
- symai/backend/engines/index/engine_qdrant.py +1011 -0
- symai/backend/engines/index/engine_vectordb.py +84 -56
- symai/backend/engines/lean/engine_lean4.py +96 -52
- symai/backend/engines/neurosymbolic/__init__.py +41 -13
- symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_chat.py +330 -248
- symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_reasoning.py +329 -264
- symai/backend/engines/neurosymbolic/engine_cerebras.py +328 -0
- symai/backend/engines/neurosymbolic/engine_deepseekX_reasoning.py +118 -88
- symai/backend/engines/neurosymbolic/engine_google_geminiX_reasoning.py +344 -299
- symai/backend/engines/neurosymbolic/engine_groq.py +173 -115
- symai/backend/engines/neurosymbolic/engine_huggingface.py +114 -84
- symai/backend/engines/neurosymbolic/engine_llama_cpp.py +144 -118
- symai/backend/engines/neurosymbolic/engine_openai_gptX_chat.py +415 -307
- symai/backend/engines/neurosymbolic/engine_openai_gptX_reasoning.py +394 -231
- symai/backend/engines/ocr/engine_apilayer.py +23 -27
- symai/backend/engines/output/engine_stdout.py +10 -13
- symai/backend/engines/{webscraping → scrape}/engine_requests.py +101 -54
- symai/backend/engines/search/engine_openai.py +100 -88
- symai/backend/engines/search/engine_parallel.py +665 -0
- symai/backend/engines/search/engine_perplexity.py +44 -45
- symai/backend/engines/search/engine_serpapi.py +37 -34
- symai/backend/engines/speech_to_text/engine_local_whisper.py +54 -51
- symai/backend/engines/symbolic/engine_wolframalpha.py +15 -9
- symai/backend/engines/text_to_speech/engine_openai.py +20 -26
- symai/backend/engines/text_vision/engine_clip.py +39 -37
- symai/backend/engines/userinput/engine_console.py +5 -6
- symai/backend/mixin/__init__.py +13 -0
- symai/backend/mixin/anthropic.py +48 -38
- symai/backend/mixin/deepseek.py +6 -5
- symai/backend/mixin/google.py +7 -4
- symai/backend/mixin/groq.py +2 -4
- symai/backend/mixin/openai.py +140 -110
- symai/backend/settings.py +87 -20
- symai/chat.py +216 -123
- symai/collect/__init__.py +7 -1
- symai/collect/dynamic.py +80 -70
- symai/collect/pipeline.py +67 -51
- symai/collect/stats.py +161 -109
- symai/components.py +707 -360
- symai/constraints.py +24 -12
- symai/core.py +1857 -1233
- symai/core_ext.py +83 -80
- symai/endpoints/api.py +166 -104
- symai/extended/.DS_Store +0 -0
- symai/extended/__init__.py +46 -12
- symai/extended/api_builder.py +29 -21
- symai/extended/arxiv_pdf_parser.py +23 -14
- symai/extended/bibtex_parser.py +9 -6
- symai/extended/conversation.py +156 -126
- symai/extended/document.py +50 -30
- symai/extended/file_merger.py +57 -14
- symai/extended/graph.py +51 -32
- symai/extended/html_style_template.py +18 -14
- symai/extended/interfaces/blip_2.py +2 -3
- symai/extended/interfaces/clip.py +4 -3
- symai/extended/interfaces/console.py +9 -1
- symai/extended/interfaces/dall_e.py +4 -2
- symai/extended/interfaces/file.py +2 -0
- symai/extended/interfaces/flux.py +4 -2
- symai/extended/interfaces/gpt_image.py +16 -7
- symai/extended/interfaces/input.py +2 -1
- symai/extended/interfaces/llava.py +1 -2
- symai/extended/interfaces/{naive_webscraping.py → naive_scrape.py} +4 -3
- symai/extended/interfaces/naive_vectordb.py +9 -10
- symai/extended/interfaces/ocr.py +5 -3
- symai/extended/interfaces/openai_search.py +2 -0
- symai/extended/interfaces/parallel.py +30 -0
- symai/extended/interfaces/perplexity.py +2 -0
- symai/extended/interfaces/pinecone.py +12 -9
- symai/extended/interfaces/python.py +2 -0
- symai/extended/interfaces/serpapi.py +3 -1
- symai/extended/interfaces/terminal.py +2 -4
- symai/extended/interfaces/tts.py +3 -2
- symai/extended/interfaces/whisper.py +3 -2
- symai/extended/interfaces/wolframalpha.py +2 -1
- symai/extended/metrics/__init__.py +11 -1
- symai/extended/metrics/similarity.py +14 -13
- symai/extended/os_command.py +39 -29
- symai/extended/packages/__init__.py +29 -3
- symai/extended/packages/symdev.py +51 -43
- symai/extended/packages/sympkg.py +41 -35
- symai/extended/packages/symrun.py +63 -50
- symai/extended/repo_cloner.py +14 -12
- symai/extended/seo_query_optimizer.py +15 -13
- symai/extended/solver.py +116 -91
- symai/extended/summarizer.py +12 -10
- symai/extended/taypan_interpreter.py +17 -18
- symai/extended/vectordb.py +122 -92
- symai/formatter/__init__.py +9 -1
- symai/formatter/formatter.py +51 -47
- symai/formatter/regex.py +70 -69
- symai/functional.py +325 -176
- symai/imports.py +190 -147
- symai/interfaces.py +57 -28
- symai/memory.py +45 -35
- symai/menu/screen.py +28 -19
- symai/misc/console.py +66 -56
- symai/misc/loader.py +8 -5
- symai/models/__init__.py +17 -1
- symai/models/base.py +395 -236
- symai/models/errors.py +1 -2
- symai/ops/__init__.py +32 -22
- symai/ops/measures.py +24 -25
- symai/ops/primitives.py +1149 -731
- symai/post_processors.py +58 -50
- symai/pre_processors.py +86 -82
- symai/processor.py +21 -13
- symai/prompts.py +764 -685
- symai/server/huggingface_server.py +135 -49
- symai/server/llama_cpp_server.py +21 -11
- symai/server/qdrant_server.py +206 -0
- symai/shell.py +100 -42
- symai/shellsv.py +700 -492
- symai/strategy.py +630 -346
- symai/symbol.py +368 -322
- symai/utils.py +100 -78
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/METADATA +22 -10
- symbolicai-1.1.0.dist-info/RECORD +168 -0
- symbolicai-0.21.0.dist-info/RECORD +0 -162
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/WHEEL +0 -0
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/entry_points.txt +0 -0
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/licenses/LICENSE +0 -0
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/top_level.txt +0 -0
|
@@ -2,20 +2,24 @@ import json
|
|
|
2
2
|
import logging
|
|
3
3
|
import re
|
|
4
4
|
from copy import copy, deepcopy
|
|
5
|
-
from typing import List, Optional
|
|
6
5
|
|
|
7
6
|
import anthropic
|
|
8
7
|
from anthropic._types import NOT_GIVEN
|
|
9
|
-
from anthropic.types import (
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
8
|
+
from anthropic.types import (
|
|
9
|
+
InputJSONDelta,
|
|
10
|
+
Message,
|
|
11
|
+
RawContentBlockDeltaEvent,
|
|
12
|
+
RawContentBlockStartEvent,
|
|
13
|
+
RawContentBlockStopEvent,
|
|
14
|
+
TextBlock,
|
|
15
|
+
TextDelta,
|
|
16
|
+
ThinkingBlock,
|
|
17
|
+
ThinkingDelta,
|
|
18
|
+
ToolUseBlock,
|
|
19
|
+
)
|
|
14
20
|
|
|
15
21
|
from ....components import SelfPrompt
|
|
16
|
-
from ....
|
|
17
|
-
from ....symbol import Symbol
|
|
18
|
-
from ....utils import CustomUserWarning, encode_media_frames
|
|
22
|
+
from ....utils import UserMessage, encode_media_frames
|
|
19
23
|
from ...base import Engine
|
|
20
24
|
from ...mixin.anthropic import AnthropicMixin
|
|
21
25
|
from ...settings import SYMAI_CONFIG
|
|
@@ -34,18 +38,19 @@ class TokenizerWrapper:
|
|
|
34
38
|
def encode(self, text: str) -> int:
|
|
35
39
|
return self.compute_tokens_func([{"role": "user", "content": text}])
|
|
36
40
|
|
|
41
|
+
|
|
37
42
|
class ClaudeXReasoningEngine(Engine, AnthropicMixin):
|
|
38
|
-
def __init__(self, api_key:
|
|
43
|
+
def __init__(self, api_key: str | None = None, model: str | None = None):
|
|
39
44
|
super().__init__()
|
|
40
45
|
self.config = deepcopy(SYMAI_CONFIG)
|
|
41
46
|
# In case we use EngineRepository.register to inject the api_key and model => dynamically change the engine at runtime
|
|
42
47
|
if api_key is not None and model is not None:
|
|
43
|
-
self.config[
|
|
44
|
-
self.config[
|
|
45
|
-
if self.id() !=
|
|
46
|
-
return
|
|
47
|
-
anthropic.api_key = self.config[
|
|
48
|
-
self.model = self.config[
|
|
48
|
+
self.config["NEUROSYMBOLIC_ENGINE_API_KEY"] = api_key
|
|
49
|
+
self.config["NEUROSYMBOLIC_ENGINE_MODEL"] = model
|
|
50
|
+
if self.id() != "neurosymbolic":
|
|
51
|
+
return # do not initialize if not neurosymbolic; avoids conflict with llama.cpp check in EngineRepository.register_from_package
|
|
52
|
+
anthropic.api_key = self.config["NEUROSYMBOLIC_ENGINE_API_KEY"]
|
|
53
|
+
self.model = self.config["NEUROSYMBOLIC_ENGINE_MODEL"]
|
|
49
54
|
self.name = self.__class__.__name__
|
|
50
55
|
self.tokenizer = TokenizerWrapper(self.compute_required_tokens)
|
|
51
56
|
self.max_context_tokens = self.api_max_context_tokens()
|
|
@@ -53,95 +58,99 @@ class ClaudeXReasoningEngine(Engine, AnthropicMixin):
|
|
|
53
58
|
self.client = anthropic.Anthropic(api_key=anthropic.api_key)
|
|
54
59
|
|
|
55
60
|
def id(self) -> str:
|
|
56
|
-
if
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
63
|
-
|
|
61
|
+
if (
|
|
62
|
+
self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
|
|
63
|
+
and self.config.get("NEUROSYMBOLIC_ENGINE_MODEL").startswith("claude")
|
|
64
|
+
and (
|
|
65
|
+
"3-7" in self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
|
|
66
|
+
or "4-0" in self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
|
|
67
|
+
or "4-1" in self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
|
|
68
|
+
or "4-5" in self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
|
|
69
|
+
)
|
|
70
|
+
):
|
|
71
|
+
return "neurosymbolic"
|
|
72
|
+
return super().id() # default to unregistered
|
|
64
73
|
|
|
65
74
|
def command(self, *args, **kwargs):
|
|
66
75
|
super().command(*args, **kwargs)
|
|
67
|
-
if
|
|
68
|
-
anthropic.api_key = kwargs[
|
|
69
|
-
if
|
|
70
|
-
self.model = kwargs[
|
|
76
|
+
if "NEUROSYMBOLIC_ENGINE_API_KEY" in kwargs:
|
|
77
|
+
anthropic.api_key = kwargs["NEUROSYMBOLIC_ENGINE_API_KEY"]
|
|
78
|
+
if "NEUROSYMBOLIC_ENGINE_MODEL" in kwargs:
|
|
79
|
+
self.model = kwargs["NEUROSYMBOLIC_ENGINE_MODEL"]
|
|
71
80
|
|
|
72
81
|
def compute_required_tokens(self, messages) -> int:
|
|
73
|
-
claude_messages =
|
|
74
|
-
system_content = None
|
|
75
|
-
|
|
76
|
-
for msg in messages:
|
|
77
|
-
if not isinstance(msg, list):
|
|
78
|
-
msg = [msg]
|
|
79
|
-
for part in msg:
|
|
80
|
-
if isinstance(part, str):
|
|
81
|
-
role = 'user'
|
|
82
|
-
content_str = part
|
|
83
|
-
elif isinstance(part, dict):
|
|
84
|
-
role = part.get('role')
|
|
85
|
-
content_str = str(part.get('content', ''))
|
|
86
|
-
else:
|
|
87
|
-
CustomUserWarning(f"Unsupported message part type: {type(part)}", raise_with=ValueError)
|
|
88
|
-
|
|
89
|
-
if role == 'system':
|
|
90
|
-
system_content = content_str
|
|
91
|
-
continue
|
|
92
|
-
|
|
93
|
-
if role in ['user', 'assistant']:
|
|
94
|
-
message_content = []
|
|
95
|
-
|
|
96
|
-
image_content = self._handle_image_content(content_str)
|
|
97
|
-
message_content.extend(image_content)
|
|
98
|
-
|
|
99
|
-
text_content = self._remove_vision_pattern(content_str)
|
|
100
|
-
if text_content:
|
|
101
|
-
message_content.append({
|
|
102
|
-
"type": "text",
|
|
103
|
-
"text": text_content
|
|
104
|
-
})
|
|
105
|
-
|
|
106
|
-
if message_content:
|
|
107
|
-
if len(message_content) == 1 and message_content[0].get('type') == 'text':
|
|
108
|
-
claude_messages.append({
|
|
109
|
-
'role': role,
|
|
110
|
-
'content': message_content[0]['text']
|
|
111
|
-
})
|
|
112
|
-
else:
|
|
113
|
-
claude_messages.append({
|
|
114
|
-
'role': role,
|
|
115
|
-
'content': message_content
|
|
116
|
-
})
|
|
82
|
+
claude_messages, system_content = self._normalize_messages_for_claude(messages)
|
|
117
83
|
|
|
118
84
|
if not claude_messages:
|
|
119
85
|
return 0
|
|
120
86
|
|
|
121
87
|
try:
|
|
122
|
-
count_params = {
|
|
123
|
-
'model': self.model,
|
|
124
|
-
'messages': claude_messages
|
|
125
|
-
}
|
|
88
|
+
count_params = {"model": self.model, "messages": claude_messages}
|
|
126
89
|
if system_content:
|
|
127
|
-
count_params[
|
|
90
|
+
count_params["system"] = system_content
|
|
128
91
|
count_response = self.client.messages.count_tokens(**count_params)
|
|
129
92
|
return count_response.input_tokens
|
|
130
93
|
except Exception as e:
|
|
131
|
-
|
|
132
|
-
|
|
94
|
+
UserMessage(f"Claude count_tokens failed: {e}")
|
|
95
|
+
UserMessage(f"Error counting tokens for Claude: {e!s}", raise_with=RuntimeError)
|
|
96
|
+
|
|
97
|
+
def _normalize_messages_for_claude(self, messages):
|
|
98
|
+
claude_messages = []
|
|
99
|
+
system_content = None
|
|
100
|
+
|
|
101
|
+
for msg in messages:
|
|
102
|
+
msg_parts = msg if isinstance(msg, list) else [msg]
|
|
103
|
+
for part in msg_parts:
|
|
104
|
+
role, content_str = self._extract_role_and_content(part)
|
|
105
|
+
if role == "system":
|
|
106
|
+
system_content = content_str
|
|
107
|
+
continue
|
|
108
|
+
|
|
109
|
+
if role in ["user", "assistant"]:
|
|
110
|
+
message_payload = self._build_message_payload(role, content_str)
|
|
111
|
+
if message_payload:
|
|
112
|
+
claude_messages.append(message_payload)
|
|
133
113
|
|
|
134
|
-
|
|
135
|
-
|
|
114
|
+
return claude_messages, system_content
|
|
115
|
+
|
|
116
|
+
def _extract_role_and_content(self, part):
|
|
117
|
+
if isinstance(part, str):
|
|
118
|
+
return "user", part
|
|
119
|
+
if isinstance(part, dict):
|
|
120
|
+
return part.get("role"), str(part.get("content", ""))
|
|
121
|
+
UserMessage(f"Unsupported message part type: {type(part)}", raise_with=ValueError)
|
|
122
|
+
return None, ""
|
|
123
|
+
|
|
124
|
+
def _build_message_payload(self, role, content_str):
|
|
125
|
+
message_content = []
|
|
126
|
+
|
|
127
|
+
image_content = self._handle_image_content(content_str)
|
|
128
|
+
message_content.extend(image_content)
|
|
129
|
+
|
|
130
|
+
text_content = self._remove_vision_pattern(content_str)
|
|
131
|
+
if text_content:
|
|
132
|
+
message_content.append({"type": "text", "text": text_content})
|
|
133
|
+
|
|
134
|
+
if not message_content:
|
|
135
|
+
return None
|
|
136
|
+
|
|
137
|
+
if len(message_content) == 1 and message_content[0].get("type") == "text":
|
|
138
|
+
return {"role": role, "content": message_content[0]["text"]}
|
|
139
|
+
|
|
140
|
+
return {"role": role, "content": message_content}
|
|
141
|
+
|
|
142
|
+
def compute_remaining_tokens(self, _prompts: list) -> int:
|
|
143
|
+
UserMessage("Method not implemented.", raise_with=NotImplementedError)
|
|
136
144
|
|
|
137
145
|
def _handle_image_content(self, content: str) -> list:
|
|
138
146
|
"""Handle image content by processing vision patterns and returning image file data."""
|
|
147
|
+
|
|
139
148
|
def extract_pattern(text):
|
|
140
|
-
pattern = r
|
|
149
|
+
pattern = r"<<vision:(.*?):>>"
|
|
141
150
|
return re.findall(pattern, text)
|
|
142
151
|
|
|
143
152
|
image_files = []
|
|
144
|
-
if
|
|
153
|
+
if "<<vision:" in content:
|
|
145
154
|
parts = extract_pattern(content)
|
|
146
155
|
for p in parts:
|
|
147
156
|
img_ = p.strip()
|
|
@@ -149,108 +158,131 @@ class ClaudeXReasoningEngine(Engine, AnthropicMixin):
|
|
|
149
158
|
max_used_frames = 10
|
|
150
159
|
buffer, ext = encode_media_frames(img_)
|
|
151
160
|
if len(buffer) > 1:
|
|
152
|
-
step = len(buffer) // max_frames_spacing
|
|
161
|
+
step = len(buffer) // max_frames_spacing # max frames spacing
|
|
153
162
|
frames = []
|
|
154
163
|
indices = list(range(0, len(buffer), step))[:max_used_frames]
|
|
155
164
|
for i in indices:
|
|
156
|
-
frames.append(
|
|
165
|
+
frames.append(
|
|
166
|
+
{"data": buffer[i], "media_type": f"image/{ext}", "type": "base64"}
|
|
167
|
+
)
|
|
157
168
|
image_files.extend(frames)
|
|
158
169
|
elif len(buffer) == 1:
|
|
159
|
-
image_files.append(
|
|
170
|
+
image_files.append(
|
|
171
|
+
{"data": buffer[0], "media_type": f"image/{ext}", "type": "base64"}
|
|
172
|
+
)
|
|
160
173
|
else:
|
|
161
|
-
|
|
174
|
+
UserMessage("No frames found for image!")
|
|
162
175
|
return image_files
|
|
163
176
|
|
|
164
177
|
def _remove_vision_pattern(self, text: str) -> str:
|
|
165
178
|
"""Remove vision patterns from text."""
|
|
166
|
-
pattern = r
|
|
167
|
-
return re.sub(pattern,
|
|
179
|
+
pattern = r"<<vision:(.*?):>>"
|
|
180
|
+
return re.sub(pattern, "", text)
|
|
168
181
|
|
|
169
182
|
def forward(self, argument):
|
|
170
183
|
kwargs = argument.kwargs
|
|
171
184
|
system, messages = argument.prop.prepared_input
|
|
172
185
|
payload = self._prepare_request_payload(argument)
|
|
173
|
-
except_remedy = kwargs.get(
|
|
186
|
+
except_remedy = kwargs.get("except_remedy")
|
|
174
187
|
|
|
175
188
|
try:
|
|
176
|
-
res = self.client.messages.create(
|
|
177
|
-
system=system,
|
|
178
|
-
messages=messages,
|
|
179
|
-
**payload
|
|
180
|
-
)
|
|
189
|
+
res = self.client.messages.create(system=system, messages=messages, **payload)
|
|
181
190
|
except Exception as e:
|
|
182
|
-
if anthropic.api_key is None or anthropic.api_key ==
|
|
183
|
-
msg =
|
|
184
|
-
|
|
185
|
-
if
|
|
186
|
-
|
|
187
|
-
|
|
191
|
+
if anthropic.api_key is None or anthropic.api_key == "":
|
|
192
|
+
msg = "Anthropic API key is not set. Please set it in the config file or pass it as an argument to the command method."
|
|
193
|
+
UserMessage(msg)
|
|
194
|
+
if (
|
|
195
|
+
self.config["NEUROSYMBOLIC_ENGINE_API_KEY"] is None
|
|
196
|
+
or self.config["NEUROSYMBOLIC_ENGINE_API_KEY"] == ""
|
|
197
|
+
):
|
|
198
|
+
UserMessage(msg, raise_with=ValueError)
|
|
199
|
+
anthropic.api_key = self.config["NEUROSYMBOLIC_ENGINE_API_KEY"]
|
|
188
200
|
|
|
189
201
|
callback = self.client.messages.create
|
|
190
|
-
kwargs[
|
|
202
|
+
kwargs["model"] = kwargs.get("model", self.model)
|
|
191
203
|
|
|
192
204
|
if except_remedy is not None:
|
|
193
205
|
res = except_remedy(self, e, callback, argument)
|
|
194
206
|
else:
|
|
195
|
-
|
|
207
|
+
UserMessage(f"Error during generation. Caused by: {e}", raise_with=ValueError)
|
|
196
208
|
|
|
197
|
-
if payload[
|
|
198
|
-
res =
|
|
199
|
-
metadata = {
|
|
209
|
+
if payload["stream"]:
|
|
210
|
+
res = list(res) # Unpack the iterator to a list
|
|
211
|
+
metadata = {"raw_output": res}
|
|
200
212
|
response_data = self._collect_response(res)
|
|
201
213
|
|
|
202
|
-
if response_data.get(
|
|
203
|
-
metadata[
|
|
214
|
+
if response_data.get("function_call"):
|
|
215
|
+
metadata["function_call"] = response_data["function_call"]
|
|
204
216
|
|
|
205
|
-
if response_data.get(
|
|
206
|
-
metadata[
|
|
217
|
+
if response_data.get("thinking") and len(response_data["thinking"]) > 0:
|
|
218
|
+
metadata["thinking"] = response_data["thinking"]
|
|
207
219
|
|
|
208
|
-
text_output = response_data.get(
|
|
220
|
+
text_output = response_data.get("text", "")
|
|
209
221
|
if argument.prop.response_format:
|
|
210
222
|
# Anthropic returns JSON in markdown format
|
|
211
|
-
text_output = text_output.replace(
|
|
223
|
+
text_output = text_output.replace("```json", "").replace("```", "")
|
|
212
224
|
|
|
213
225
|
return [text_output], metadata
|
|
214
226
|
|
|
215
227
|
def _prepare_raw_input(self, argument):
|
|
216
228
|
if not argument.prop.processed_input:
|
|
217
|
-
|
|
229
|
+
msg = "Need to provide a prompt instruction to the engine if `raw_input` is enabled!"
|
|
230
|
+
UserMessage(msg)
|
|
231
|
+
raise ValueError(msg)
|
|
218
232
|
system = NOT_GIVEN
|
|
219
233
|
prompt = copy(argument.prop.processed_input)
|
|
220
|
-
if
|
|
221
|
-
if
|
|
222
|
-
prompt = {
|
|
234
|
+
if not isinstance(prompt, list):
|
|
235
|
+
if not isinstance(prompt, dict):
|
|
236
|
+
prompt = {"role": "user", "content": str(prompt)}
|
|
223
237
|
prompt = [prompt]
|
|
224
238
|
if len(prompt) > 1:
|
|
225
239
|
# assert there are not more than 1 system instruction
|
|
226
|
-
assert len([p for p in prompt if p[
|
|
240
|
+
assert len([p for p in prompt if p["role"] == "system"]) <= 1, (
|
|
241
|
+
"Only one system instruction is allowed!"
|
|
242
|
+
)
|
|
227
243
|
for p in prompt:
|
|
228
|
-
if p[
|
|
229
|
-
system = p[
|
|
244
|
+
if p["role"] == "system":
|
|
245
|
+
system = p["content"]
|
|
230
246
|
prompt.remove(p)
|
|
231
247
|
break
|
|
232
248
|
return system, prompt
|
|
233
249
|
|
|
234
250
|
def prepare(self, argument):
|
|
235
|
-
|
|
251
|
+
# @NOTE: OpenAI compatibility at high level
|
|
236
252
|
if argument.prop.raw_input:
|
|
237
253
|
argument.prop.prepared_input = self._prepare_raw_input(argument)
|
|
238
254
|
return
|
|
239
255
|
|
|
240
256
|
_non_verbose_output = """<META_INSTRUCTION/>\nYou do not output anything else, like verbose preambles or post explanation, such as "Sure, let me...", "Hope that was helpful...", "Yes, I can help you with that...", etc. Consider well formatted output, e.g. for sentences use punctuation, spaces etc. or for code use indentation, etc. Never add meta instructions information to your output!\n\n"""
|
|
241
|
-
|
|
242
|
-
system
|
|
257
|
+
image_files = self._handle_image_content(str(argument.prop.processed_input))
|
|
258
|
+
system = self._build_system_prompt(argument, _non_verbose_output, image_files)
|
|
259
|
+
user_text = self._build_user_text(argument, image_files)
|
|
260
|
+
|
|
261
|
+
if not user_text:
|
|
262
|
+
# Anthropic doesn't allow empty user prompts; force it
|
|
263
|
+
user_text = "N/A"
|
|
264
|
+
|
|
265
|
+
system, user_prompt = self._apply_self_prompt_if_needed(
|
|
266
|
+
argument, system, user_text, image_files
|
|
267
|
+
)
|
|
268
|
+
|
|
269
|
+
argument.prop.prepared_input = (system, [user_prompt])
|
|
270
|
+
|
|
271
|
+
def _build_system_prompt(self, argument, non_verbose_output, image_files):
|
|
272
|
+
system = ""
|
|
243
273
|
|
|
244
274
|
if argument.prop.suppress_verbose_output:
|
|
245
|
-
system
|
|
246
|
-
system = f'{system}\n' if system and len(system) > 0 else ''
|
|
275
|
+
system = f"{non_verbose_output}\n"
|
|
247
276
|
|
|
248
277
|
if argument.prop.response_format:
|
|
249
|
-
|
|
250
|
-
if not (
|
|
251
|
-
|
|
252
|
-
|
|
253
|
-
|
|
278
|
+
response_format = argument.prop.response_format
|
|
279
|
+
if not (response_format.get("type") is not None):
|
|
280
|
+
UserMessage(
|
|
281
|
+
'Response format type is required! Expected format `{"type": "json_object"}` or other supported types. Refer to Anthropic documentation for details.',
|
|
282
|
+
raise_with=AssertionError,
|
|
283
|
+
)
|
|
284
|
+
system += non_verbose_output
|
|
285
|
+
system += f"<RESPONSE_FORMAT/>\n{response_format['type']}\n\n"
|
|
254
286
|
|
|
255
287
|
ref = argument.prop.instance
|
|
256
288
|
static_ctxt, dyn_ctxt = ref.global_context
|
|
@@ -261,94 +293,89 @@ class ClaudeXReasoningEngine(Engine, AnthropicMixin):
|
|
|
261
293
|
system += f"<DYNAMIC_CONTEXT/>\n{dyn_ctxt}\n\n"
|
|
262
294
|
|
|
263
295
|
payload = argument.prop.payload
|
|
264
|
-
if
|
|
265
|
-
system += f"<ADDITIONAL_CONTEXT/>\n{
|
|
296
|
+
if payload:
|
|
297
|
+
system += f"<ADDITIONAL_CONTEXT/>\n{payload!s}\n\n"
|
|
266
298
|
|
|
267
|
-
examples:
|
|
299
|
+
examples: list[str] = argument.prop.examples
|
|
268
300
|
if examples and len(examples) > 0:
|
|
269
|
-
system += f"<EXAMPLES/>\n{
|
|
270
|
-
|
|
271
|
-
image_files = self._handle_image_content(str(argument.prop.processed_input))
|
|
301
|
+
system += f"<EXAMPLES/>\n{examples!s}\n\n"
|
|
272
302
|
|
|
273
303
|
if argument.prop.prompt is not None and len(argument.prop.prompt) > 0:
|
|
274
|
-
|
|
304
|
+
value = str(argument.prop.prompt)
|
|
275
305
|
if len(image_files) > 0:
|
|
276
|
-
|
|
277
|
-
system += f"<INSTRUCTION/>\n{
|
|
306
|
+
value = self._remove_vision_pattern(value)
|
|
307
|
+
system += f"<INSTRUCTION/>\n{value}\n\n"
|
|
308
|
+
|
|
309
|
+
return self._append_template_suffix(system, argument.prop.template_suffix)
|
|
278
310
|
|
|
279
|
-
|
|
311
|
+
def _build_user_text(self, argument, image_files):
|
|
312
|
+
suffix = str(argument.prop.processed_input)
|
|
280
313
|
if len(image_files) > 0:
|
|
281
314
|
suffix = self._remove_vision_pattern(suffix)
|
|
315
|
+
return suffix
|
|
282
316
|
|
|
283
|
-
|
|
317
|
+
def _append_template_suffix(self, system, template_suffix):
|
|
318
|
+
if template_suffix:
|
|
319
|
+
return system + (
|
|
320
|
+
f" You will only generate content for the placeholder `{template_suffix!s}` "
|
|
321
|
+
"following the instructions and the provided context information.\n\n"
|
|
322
|
+
)
|
|
323
|
+
return system
|
|
284
324
|
|
|
285
|
-
|
|
286
|
-
|
|
287
|
-
|
|
325
|
+
def _apply_self_prompt_if_needed(self, argument, system, user_text, image_files):
|
|
326
|
+
if not self._is_self_prompt_enabled(argument):
|
|
327
|
+
return system, self._format_user_prompt(user_text, image_files)
|
|
288
328
|
|
|
289
|
-
|
|
290
|
-
|
|
329
|
+
self_prompter = SelfPrompt()
|
|
330
|
+
response = self_prompter(
|
|
331
|
+
{"user": user_text, "system": system},
|
|
332
|
+
max_tokens=argument.kwargs.get("max_tokens", self.max_response_tokens),
|
|
333
|
+
thinking=argument.kwargs.get("thinking", NOT_GIVEN),
|
|
334
|
+
)
|
|
335
|
+
if response is None:
|
|
336
|
+
UserMessage("Self-prompting failed to return a response.", raise_with=ValueError)
|
|
291
337
|
|
|
292
|
-
|
|
293
|
-
|
|
294
|
-
user_prompt = { "role": "user", "content": [
|
|
295
|
-
*images,
|
|
296
|
-
{ 'type': 'text', 'text': user }
|
|
297
|
-
]}
|
|
298
|
-
else:
|
|
299
|
-
user_prompt = { "role": "user", "content": user }
|
|
300
|
-
|
|
301
|
-
# First check if the `Symbol` instance has the flag set, otherwise check if it was passed as an argument to a method
|
|
302
|
-
if argument.prop.instance._kwargs.get('self_prompt', False) or argument.prop.self_prompt:
|
|
303
|
-
self_prompter = SelfPrompt()
|
|
304
|
-
|
|
305
|
-
res = self_prompter(
|
|
306
|
-
{'user': user, 'system': system},
|
|
307
|
-
max_tokens=argument.kwargs.get('max_tokens', self.max_response_tokens),
|
|
308
|
-
thinking=argument.kwargs.get('thinking', NOT_GIVEN),
|
|
309
|
-
)
|
|
310
|
-
if res is None:
|
|
311
|
-
CustomUserWarning("Self-prompting failed to return a response.", raise_with=ValueError)
|
|
338
|
+
updated_prompt = self._format_user_prompt(response["user"], image_files)
|
|
339
|
+
return response["system"], updated_prompt
|
|
312
340
|
|
|
313
|
-
|
|
314
|
-
|
|
315
|
-
*images,
|
|
316
|
-
{ 'type': 'text', 'text': res['user'] }
|
|
317
|
-
]}
|
|
318
|
-
else:
|
|
319
|
-
user_prompt = { "role": "user", "content": res['user'] }
|
|
341
|
+
def _is_self_prompt_enabled(self, argument):
|
|
342
|
+
return argument.prop.instance._kwargs.get("self_prompt", False) or argument.prop.self_prompt
|
|
320
343
|
|
|
321
|
-
|
|
344
|
+
def _format_user_prompt(self, user_text, image_files):
|
|
345
|
+
if len(image_files) > 0:
|
|
346
|
+
images = [{"type": "image", "source": im} for im in image_files]
|
|
347
|
+
return {"role": "user", "content": [*images, {"type": "text", "text": user_text}]}
|
|
322
348
|
|
|
323
|
-
|
|
349
|
+
return {"role": "user", "content": user_text}
|
|
324
350
|
|
|
325
351
|
def _prepare_request_payload(self, argument):
|
|
326
352
|
kwargs = argument.kwargs
|
|
327
|
-
model = kwargs.get(
|
|
328
|
-
stop = kwargs.get(
|
|
329
|
-
temperature = kwargs.get(
|
|
330
|
-
thinking_arg = kwargs.get(
|
|
353
|
+
model = kwargs.get("model", self.model)
|
|
354
|
+
stop = kwargs.get("stop", NOT_GIVEN)
|
|
355
|
+
temperature = kwargs.get("temperature", 1)
|
|
356
|
+
thinking_arg = kwargs.get("thinking", NOT_GIVEN)
|
|
331
357
|
thinking = NOT_GIVEN
|
|
332
358
|
if thinking_arg and isinstance(thinking_arg, dict):
|
|
333
|
-
thinking = {
|
|
334
|
-
|
|
335
|
-
|
|
336
|
-
|
|
337
|
-
|
|
338
|
-
|
|
339
|
-
|
|
340
|
-
|
|
341
|
-
|
|
342
|
-
|
|
343
|
-
|
|
344
|
-
|
|
345
|
-
|
|
359
|
+
thinking = {"type": "enabled", "budget_tokens": thinking_arg.get("budget_tokens", 1024)}
|
|
360
|
+
top_p = kwargs.get(
|
|
361
|
+
"top_p", NOT_GIVEN if temperature is not None else 1
|
|
362
|
+
) # @NOTE:'You should either alter temperature or top_p, but not both.'
|
|
363
|
+
top_k = kwargs.get("top_k", NOT_GIVEN)
|
|
364
|
+
stream = kwargs.get(
|
|
365
|
+
"stream", True
|
|
366
|
+
) # Do NOT remove this default value! Getting tons of API errors because they can't process requests >10m
|
|
367
|
+
tools = kwargs.get("tools", NOT_GIVEN)
|
|
368
|
+
tool_choice = kwargs.get("tool_choice", NOT_GIVEN)
|
|
369
|
+
metadata_anthropic = kwargs.get("metadata", NOT_GIVEN)
|
|
370
|
+
max_tokens = kwargs.get("max_tokens", self.max_response_tokens)
|
|
371
|
+
|
|
372
|
+
if stop != NOT_GIVEN and not isinstance(stop, list):
|
|
346
373
|
stop = [stop]
|
|
347
374
|
|
|
348
|
-
|
|
375
|
+
# @NOTE: Anthropic fails if stop is not raw string, so cast it to r'…'
|
|
349
376
|
# E.g. when we use defaults in core.py, i.e. stop=['\n']
|
|
350
377
|
if stop != NOT_GIVEN:
|
|
351
|
-
stop = [r
|
|
378
|
+
stop = [r"{s}" for s in stop]
|
|
352
379
|
|
|
353
380
|
return {
|
|
354
381
|
"model": model,
|
|
@@ -361,82 +388,120 @@ class ClaudeXReasoningEngine(Engine, AnthropicMixin):
|
|
|
361
388
|
"stream": stream,
|
|
362
389
|
"metadata": metadata_anthropic,
|
|
363
390
|
"tools": tools,
|
|
364
|
-
"tool_choice": tool_choice
|
|
391
|
+
"tool_choice": tool_choice,
|
|
365
392
|
}
|
|
366
393
|
|
|
367
394
|
def _collect_response(self, res):
|
|
368
395
|
if isinstance(res, list):
|
|
369
|
-
|
|
370
|
-
text_content = ''
|
|
371
|
-
tool_calls_raw = []
|
|
372
|
-
active_tool_calls = {}
|
|
373
|
-
|
|
374
|
-
for chunk in res:
|
|
375
|
-
if isinstance(chunk, RawContentBlockStartEvent):
|
|
376
|
-
if isinstance(chunk.content_block, ToolUseBlock):
|
|
377
|
-
active_tool_calls[chunk.index] = {
|
|
378
|
-
'id': chunk.content_block.id,
|
|
379
|
-
'name': chunk.content_block.name,
|
|
380
|
-
'input_json_str': ""
|
|
381
|
-
}
|
|
382
|
-
elif isinstance(chunk, RawContentBlockDeltaEvent):
|
|
383
|
-
if isinstance(chunk.delta, ThinkingDelta):
|
|
384
|
-
thinking_content += chunk.delta.thinking
|
|
385
|
-
elif isinstance(chunk.delta, TextDelta):
|
|
386
|
-
text_content += chunk.delta.text
|
|
387
|
-
elif isinstance(chunk.delta, InputJSONDelta):
|
|
388
|
-
if chunk.index in active_tool_calls:
|
|
389
|
-
active_tool_calls[chunk.index]['input_json_str'] += chunk.delta.partial_json
|
|
390
|
-
elif isinstance(chunk, RawContentBlockStopEvent):
|
|
391
|
-
if chunk.index in active_tool_calls:
|
|
392
|
-
tool_call_info = active_tool_calls.pop(chunk.index)
|
|
393
|
-
try:
|
|
394
|
-
tool_call_info['input'] = json.loads(tool_call_info['input_json_str'])
|
|
395
|
-
except json.JSONDecodeError as e:
|
|
396
|
-
logging.error(f"Failed to parse JSON for tool call {tool_call_info['name']}: {e}. Raw JSON: '{tool_call_info['input_json_str']}'")
|
|
397
|
-
tool_call_info['input'] = {}
|
|
398
|
-
tool_calls_raw.append(tool_call_info)
|
|
399
|
-
|
|
400
|
-
function_call_data = None
|
|
401
|
-
if tool_calls_raw:
|
|
402
|
-
if len(tool_calls_raw) > 1:
|
|
403
|
-
CustomUserWarning("Multiple tool calls detected in the stream but only the first one will be processed.")
|
|
404
|
-
function_call_data = {
|
|
405
|
-
'name': tool_calls_raw[0]['name'],
|
|
406
|
-
'arguments': tool_calls_raw[0]['input']
|
|
407
|
-
}
|
|
408
|
-
|
|
409
|
-
return {
|
|
410
|
-
"thinking": thinking_content,
|
|
411
|
-
"text": text_content,
|
|
412
|
-
"function_call": function_call_data
|
|
413
|
-
}
|
|
396
|
+
return self._collect_stream_response(res)
|
|
414
397
|
|
|
415
|
-
# Non-streamed response (res is a Message object)
|
|
416
398
|
if isinstance(res, Message):
|
|
417
|
-
|
|
418
|
-
|
|
419
|
-
|
|
420
|
-
|
|
421
|
-
|
|
422
|
-
|
|
423
|
-
|
|
424
|
-
|
|
425
|
-
|
|
426
|
-
|
|
427
|
-
|
|
428
|
-
|
|
429
|
-
|
|
430
|
-
|
|
431
|
-
|
|
432
|
-
|
|
433
|
-
|
|
434
|
-
|
|
435
|
-
|
|
436
|
-
|
|
437
|
-
|
|
438
|
-
|
|
439
|
-
|
|
399
|
+
return self._collect_message_response(res)
|
|
400
|
+
|
|
401
|
+
UserMessage(
|
|
402
|
+
f"Unexpected response type from Anthropic API: {type(res)}", raise_with=ValueError
|
|
403
|
+
)
|
|
404
|
+
return {}
|
|
405
|
+
|
|
def _collect_stream_response(self, response_chunks):
    """Fold a stream of raw Anthropic events into a single response dict.

    Returns a dict with keys ``thinking``, ``text`` and ``function_call``
    (the latter is ``None`` when no tool call appeared in the stream).
    """
    state = {"thinking": "", "text": ""}
    completed_calls = []
    in_flight_calls = {}

    # Each event mutates the accumulators; tool calls are finalized on
    # their stop event and collected into completed_calls.
    for event in response_chunks:
        self._process_stream_chunk(event, state, in_flight_calls, completed_calls)

    return {
        "thinking": state["thinking"],
        "text": state["text"],
        "function_call": self._extract_function_call(completed_calls),
    }
|
def _process_stream_chunk(self, chunk, accumulators, active_tool_calls, tool_calls_raw):
    """Route one raw stream event to the handler for its event type."""
    # The three raw event classes are disjoint, so dispatch order is irrelevant.
    if isinstance(chunk, RawContentBlockStopEvent):
        self._finalize_tool_call(chunk, active_tool_calls, tool_calls_raw)
    elif isinstance(chunk, RawContentBlockDeltaEvent):
        self._handle_delta_chunk(chunk, accumulators, active_tool_calls)
    elif isinstance(chunk, RawContentBlockStartEvent):
        self._register_tool_call(chunk, active_tool_calls)
|
def _register_tool_call(self, chunk, active_tool_calls):
    """Begin tracking a tool-use block announced by a content-start event."""
    block = chunk.content_block
    if not isinstance(block, ToolUseBlock):
        return
    # The JSON arguments arrive incrementally; start with an empty buffer.
    active_tool_calls[chunk.index] = {
        "id": block.id,
        "name": block.name,
        "input_json_str": "",
    }
def _handle_delta_chunk(self, chunk, accumulators, active_tool_calls):
    """Fold one delta event into the running thinking/text/tool-call buffers."""
    delta = chunk.delta
    if isinstance(delta, ThinkingDelta):
        accumulators["thinking"] += delta.thinking
        return
    if isinstance(delta, TextDelta):
        accumulators["text"] += delta.text
        return
    if isinstance(delta, InputJSONDelta):
        # Only append when the tool call was registered by a start event.
        entry = active_tool_calls.get(chunk.index)
        if entry is not None:
            entry["input_json_str"] += delta.partial_json
445
|
+
def _finalize_tool_call(self, chunk, active_tool_calls, tool_calls_raw):
|
|
446
|
+
if chunk.index not in active_tool_calls:
|
|
447
|
+
return
|
|
448
|
+
|
|
449
|
+
tool_call_info = active_tool_calls.pop(chunk.index)
|
|
450
|
+
try:
|
|
451
|
+
tool_call_info["input"] = json.loads(tool_call_info["input_json_str"])
|
|
452
|
+
except json.JSONDecodeError as error:
|
|
453
|
+
UserMessage(
|
|
454
|
+
f"Failed to parse JSON for tool call {tool_call_info['name']}: {error}. Raw JSON: '{tool_call_info['input_json_str']}'"
|
|
455
|
+
)
|
|
456
|
+
tool_call_info["input"] = {}
|
|
457
|
+
tool_calls_raw.append(tool_call_info)
|
|
458
|
+
|
|
459
|
+
def _extract_function_call(self, tool_calls_raw):
|
|
460
|
+
if not tool_calls_raw:
|
|
461
|
+
return None
|
|
462
|
+
|
|
463
|
+
if len(tool_calls_raw) > 1:
|
|
464
|
+
UserMessage(
|
|
465
|
+
"Multiple tool calls detected in the stream but only the first one will be processed."
|
|
466
|
+
)
|
|
467
|
+
|
|
468
|
+
first_call = tool_calls_raw[0]
|
|
469
|
+
return {"name": first_call["name"], "arguments": first_call["input"]}
|
|
470
|
+
|
|
def _collect_message_response(self, message):
    """Aggregate the content blocks of a non-streamed Message.

    Walks ``message.content`` once, accumulating thinking and text and
    capturing at most one tool call (the first encountered).
    """
    totals = {"thinking": "", "text": ""}
    call_data = None
    saw_tool_call = False

    for block in message.content:
        call_data, saw_tool_call = self._process_message_block(
            block, totals, call_data, saw_tool_call
        )

    return {
        "thinking": totals["thinking"],
        "text": totals["text"],
        "function_call": call_data,
    }
def _process_message_block(
    self, content_block, accumulators, function_call_data, tool_call_detected
):
    """Fold one message content block into the accumulators.

    Returns the updated ``(function_call_data, tool_call_detected)`` pair.
    Only the first ToolUseBlock is captured; later ones trigger a warning
    and are otherwise ignored.
    """
    if isinstance(content_block, ThinkingBlock):
        accumulators["thinking"] += content_block.thinking
    elif isinstance(content_block, TextBlock):
        accumulators["text"] += content_block.text
    elif isinstance(content_block, ToolUseBlock):
        if tool_call_detected:
            UserMessage(
                "Multiple tool use blocks detected in the response but only the first one will be processed."
            )
        else:
            return {"name": content_block.name, "arguments": content_block.input}, True
    # Unrecognized block types (and already-handled cases) leave state as-is.
    return function_call_data, tool_call_detected
|