symbolicai 0.20.2__py3-none-any.whl → 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- symai/__init__.py +96 -64
- symai/backend/base.py +93 -80
- symai/backend/engines/drawing/engine_bfl.py +12 -11
- symai/backend/engines/drawing/engine_gpt_image.py +108 -87
- symai/backend/engines/embedding/engine_llama_cpp.py +25 -28
- symai/backend/engines/embedding/engine_openai.py +3 -5
- symai/backend/engines/execute/engine_python.py +6 -5
- symai/backend/engines/files/engine_io.py +74 -67
- symai/backend/engines/imagecaptioning/engine_blip2.py +3 -3
- symai/backend/engines/imagecaptioning/engine_llavacpp_client.py +54 -38
- symai/backend/engines/index/engine_pinecone.py +23 -24
- symai/backend/engines/index/engine_vectordb.py +16 -14
- symai/backend/engines/lean/engine_lean4.py +38 -34
- symai/backend/engines/neurosymbolic/__init__.py +41 -13
- symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_chat.py +262 -182
- symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_reasoning.py +263 -191
- symai/backend/engines/neurosymbolic/engine_deepseekX_reasoning.py +53 -49
- symai/backend/engines/neurosymbolic/engine_google_geminiX_reasoning.py +212 -211
- symai/backend/engines/neurosymbolic/engine_groq.py +87 -63
- symai/backend/engines/neurosymbolic/engine_huggingface.py +21 -24
- symai/backend/engines/neurosymbolic/engine_llama_cpp.py +117 -48
- symai/backend/engines/neurosymbolic/engine_openai_gptX_chat.py +256 -229
- symai/backend/engines/neurosymbolic/engine_openai_gptX_reasoning.py +270 -150
- symai/backend/engines/ocr/engine_apilayer.py +6 -8
- symai/backend/engines/output/engine_stdout.py +1 -4
- symai/backend/engines/search/engine_openai.py +7 -7
- symai/backend/engines/search/engine_perplexity.py +5 -5
- symai/backend/engines/search/engine_serpapi.py +12 -14
- symai/backend/engines/speech_to_text/engine_local_whisper.py +20 -27
- symai/backend/engines/symbolic/engine_wolframalpha.py +3 -3
- symai/backend/engines/text_to_speech/engine_openai.py +5 -7
- symai/backend/engines/text_vision/engine_clip.py +7 -11
- symai/backend/engines/userinput/engine_console.py +3 -3
- symai/backend/engines/webscraping/engine_requests.py +81 -48
- symai/backend/mixin/__init__.py +13 -0
- symai/backend/mixin/anthropic.py +4 -2
- symai/backend/mixin/deepseek.py +2 -0
- symai/backend/mixin/google.py +2 -0
- symai/backend/mixin/openai.py +11 -3
- symai/backend/settings.py +83 -16
- symai/chat.py +101 -78
- symai/collect/__init__.py +7 -1
- symai/collect/dynamic.py +77 -69
- symai/collect/pipeline.py +35 -27
- symai/collect/stats.py +75 -63
- symai/components.py +198 -169
- symai/constraints.py +15 -12
- symai/core.py +698 -359
- symai/core_ext.py +32 -34
- symai/endpoints/api.py +80 -73
- symai/extended/.DS_Store +0 -0
- symai/extended/__init__.py +46 -12
- symai/extended/api_builder.py +11 -8
- symai/extended/arxiv_pdf_parser.py +13 -12
- symai/extended/bibtex_parser.py +2 -3
- symai/extended/conversation.py +101 -90
- symai/extended/document.py +17 -10
- symai/extended/file_merger.py +18 -13
- symai/extended/graph.py +18 -13
- symai/extended/html_style_template.py +2 -4
- symai/extended/interfaces/blip_2.py +1 -2
- symai/extended/interfaces/clip.py +1 -2
- symai/extended/interfaces/console.py +7 -1
- symai/extended/interfaces/dall_e.py +1 -1
- symai/extended/interfaces/flux.py +1 -1
- symai/extended/interfaces/gpt_image.py +1 -1
- symai/extended/interfaces/input.py +1 -1
- symai/extended/interfaces/llava.py +0 -1
- symai/extended/interfaces/naive_vectordb.py +7 -8
- symai/extended/interfaces/naive_webscraping.py +1 -1
- symai/extended/interfaces/ocr.py +1 -1
- symai/extended/interfaces/pinecone.py +6 -5
- symai/extended/interfaces/serpapi.py +1 -1
- symai/extended/interfaces/terminal.py +2 -3
- symai/extended/interfaces/tts.py +1 -1
- symai/extended/interfaces/whisper.py +1 -1
- symai/extended/interfaces/wolframalpha.py +1 -1
- symai/extended/metrics/__init__.py +11 -1
- symai/extended/metrics/similarity.py +11 -13
- symai/extended/os_command.py +17 -16
- symai/extended/packages/__init__.py +29 -3
- symai/extended/packages/symdev.py +19 -16
- symai/extended/packages/sympkg.py +12 -9
- symai/extended/packages/symrun.py +21 -19
- symai/extended/repo_cloner.py +11 -10
- symai/extended/seo_query_optimizer.py +1 -2
- symai/extended/solver.py +20 -23
- symai/extended/summarizer.py +4 -3
- symai/extended/taypan_interpreter.py +10 -12
- symai/extended/vectordb.py +99 -82
- symai/formatter/__init__.py +9 -1
- symai/formatter/formatter.py +12 -16
- symai/formatter/regex.py +62 -63
- symai/functional.py +176 -122
- symai/imports.py +136 -127
- symai/interfaces.py +56 -27
- symai/memory.py +14 -13
- symai/misc/console.py +49 -39
- symai/misc/loader.py +5 -3
- symai/models/__init__.py +17 -1
- symai/models/base.py +269 -181
- symai/models/errors.py +0 -1
- symai/ops/__init__.py +32 -22
- symai/ops/measures.py +11 -15
- symai/ops/primitives.py +348 -228
- symai/post_processors.py +32 -28
- symai/pre_processors.py +39 -41
- symai/processor.py +6 -4
- symai/prompts.py +59 -45
- symai/server/huggingface_server.py +23 -20
- symai/server/llama_cpp_server.py +7 -5
- symai/shell.py +3 -4
- symai/shellsv.py +499 -375
- symai/strategy.py +517 -287
- symai/symbol.py +111 -116
- symai/utils.py +42 -36
- {symbolicai-0.20.2.dist-info → symbolicai-1.0.0.dist-info}/METADATA +4 -2
- symbolicai-1.0.0.dist-info/RECORD +163 -0
- symbolicai-0.20.2.dist-info/RECORD +0 -162
- {symbolicai-0.20.2.dist-info → symbolicai-1.0.0.dist-info}/WHEEL +0 -0
- {symbolicai-0.20.2.dist-info → symbolicai-1.0.0.dist-info}/entry_points.txt +0 -0
- {symbolicai-0.20.2.dist-info → symbolicai-1.0.0.dist-info}/licenses/LICENSE +0 -0
- {symbolicai-0.20.2.dist-info → symbolicai-1.0.0.dist-info}/top_level.txt +0 -0
symai/backend/engines/neurosymbolic/engine_openai_gptX_reasoning.py

```diff
@@ -7,9 +7,8 @@ import openai
 import tiktoken
 
 from ....components import SelfPrompt
-from ....misc.console import ConsoleStyle
 from ....symbol import Symbol
-from ....utils import
+from ....utils import UserMessage, encode_media_frames
 from ...base import Engine
 from ...mixin.openai import OpenAIMixin
 from ...settings import SYMAI_CONFIG
@@ -36,7 +35,7 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         self.name = self.__class__.__name__
         try:
             self.tokenizer = tiktoken.encoding_for_model(self.model)
-        except Exception
+        except Exception:
             self.tokenizer = tiktoken.get_encoding('o200k_base')
         self.max_context_tokens = self.api_max_context_tokens()
         self.max_response_tokens = self.api_max_response_tokens()
@@ -45,7 +44,7 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         try:
            self.client = openai.Client(api_key=openai.api_key)
         except Exception as e:
-
+            UserMessage(f'Failed to initialize OpenAI client. Please check your OpenAI library version. Caused by: {e}', raise_with=ValueError)
 
     def id(self) -> str:
         if self.config.get('NEUROSYMBOLIC_ENGINE_MODEL') and \
```
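Throughout this file the release swaps the previous warning helper for `UserMessage` imported from `symai/utils.py`, passing `raise_with=<ExceptionType>` wherever the message should abort execution. The helper's exact behaviour is not shown in this diff; a minimal sketch of the assumed contract (warn by default, raise when asked) looks like this:

```python
import warnings


def user_message(message: str, raise_with: type[Exception] | None = None) -> None:
    """Hypothetical stand-in for symai.utils.UserMessage: warn by default,
    escalate to the given exception type when raise_with is provided."""
    if raise_with is not None:
        raise raise_with(message)
    warnings.warn(message, UserWarning, stacklevel=2)


# user_message("OpenAI API key is not set.")                           # warns only
# user_message("Failed to initialize client.", raise_with=ValueError)  # raises ValueError
```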
```diff
@@ -82,7 +81,7 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
             tokens_per_message = 3
             tokens_per_name = 1
         else:
-
+            UserMessage(
                 f"'num_tokens_from_messages()' is not implemented for model {self.model}. "
                 "See https://cookbook.openai.com/examples/how_to_count_tokens_with_tiktoken for information on how messages are converted to tokens.",
                 raise_with=NotImplementedError
@@ -92,7 +91,7 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         for message in messages:
             num_tokens += tokens_per_message
             for key, value in message.items():
-                if
+                if isinstance(value, str):
                     num_tokens += len(self.tokenizer.encode(value, disallowed_special=()))
                 else:
                     for v in value:
@@ -122,9 +121,7 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         parts = _extract_pattern(content)
         for p in parts:
             img_ = p.strip()
-            if img_.startswith('http'):
-                image_files.append(img_)
-            elif img_.startswith('data:image'):
+            if img_.startswith('http') or img_.startswith('data:image'):
                 image_files.append(img_)
             else:
                 max_frames_spacing = 50
@@ -134,7 +131,7 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
                     max_used_frames, img_ = img_.split(':')
                     max_used_frames = int(max_used_frames)
                     if max_used_frames < 1 or max_used_frames > max_frames_spacing:
-
+                        UserMessage(f"Invalid max_used_frames value: {max_used_frames}. Expected value between 1 and {max_frames_spacing}", raise_with=ValueError)
                 buffer, ext = encode_media_frames(img_)
                 if len(buffer) > 1:
                     step = len(buffer) // max_frames_spacing # max frames spacing
@@ -146,7 +143,7 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
                 elif len(buffer) == 1:
                     image_files.append(f"data:image/{ext};base64,{buffer[0]}")
                 else:
-
+                    UserMessage('No frames found or error in encoding frames')
         return image_files
 
     def _remove_vision_pattern(self, text: str) -> str:
```
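The vision handling above keys off `<<vision:...:>>` markers and now routes `http` URLs and `data:image` URIs through a single branch. A small self-contained sketch of that marker handling, reusing the regex shown in `_remove_vision_pattern` (the helper names below are illustrative, not part of the package):

```python
import re

VISION_PATTERN = r'<<vision:(.*?):>>'  # same pattern the engine strips from prompts


def extract_vision_refs(text: str) -> list[str]:
    """Collect image references embedded as <<vision:...:>> markers."""
    refs = [p.strip() for p in re.findall(VISION_PATTERN, text)]
    # URLs and already-encoded data URIs are used as-is; anything else would
    # go through frame encoding in the real engine.
    return [r for r in refs if r.startswith('http') or r.startswith('data:image')]


def remove_vision_refs(text: str) -> str:
    """Strip the markers so only plain text reaches the prompt."""
    return re.sub(VISION_PATTERN, '', text)


assert extract_vision_refs('see <<vision:https://x.test/cat.png:>> please') == ['https://x.test/cat.png']
assert remove_vision_refs('see <<vision:https://x.test/cat.png:>> please') == 'see  please'
```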
```diff
@@ -154,16 +151,79 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         pattern = r'<<vision:(.*?):>>'
         return re.sub(pattern, '', text)
 
-    def
-        """
-
-
-        new_len = max(100, new_len) # Ensure minimum token length
-        return tokens[-new_len:] if truncation_type == 'head' else tokens[:new_len] # else 'tail'
+    def _slice_tokens(self, tokens, new_len, truncation_type):
+        """Slice tokens based on truncation type."""
+        new_len = max(100, new_len) # Ensure minimum token length
+        return tokens[-new_len:] if truncation_type == 'head' else tokens[:new_len] # else 'tail'
 
+    def _validate_truncation_prompts(self, prompts: list[dict]) -> bool:
+        """Validate prompt structure before truncation."""
         if len(prompts) != 2 and all(prompt['role'] in ['developer', 'user'] for prompt in prompts):
             # Only support developer and user prompts
-
+            UserMessage(
+                f"Token truncation currently supports only two messages, from 'user' and 'developer' (got {len(prompts)}). Returning original prompts."
+            )
+            return False
+        return True
+
+    def _collect_user_tokens(
+        self,
+        user_prompt: dict,
+    ) -> tuple[list[int], bool]:
+        """Collect user tokens and detect unsupported content."""
+        user_tokens: list[int] = []
+        user_content = user_prompt['content']
+        if isinstance(user_content, str):
+            user_tokens.extend(Symbol(user_content).tokens)
+            return user_tokens, False
+        if isinstance(user_content, list):
+            for content_item in user_content:
+                if isinstance(content_item, dict):
+                    if content_item.get('type') == 'text':
+                        user_tokens.extend(Symbol(content_item['text']).tokens)
+                    else:
+                        return user_tokens, True
+                else:
+                    UserMessage(
+                        f"Invalid content type: {type(content_item)}. Format input according to the documentation. See https://platform.openai.com/docs/api-reference/chat/create?lang=python",
+                        raise_with=ValueError,
+                    )
+            return user_tokens, False
+        return UserMessage(
+            f"Unknown content type: {type(user_prompt['content'])}. Format input according to the documentation. See https://platform.openai.com/docs/api-reference/chat/create?lang=python",
+            raise_with=ValueError,
+        )
+
+    def _truncate_single_prompt_exceed(
+        self,
+        system_tokens,
+        user_tokens,
+        system_token_count,
+        user_token_count,
+        max_prompt_tokens,
+        truncation_type,
+    ):
+        """Handle truncation when only one prompt exceeds the limit."""
+        half_limit = max_prompt_tokens / 2
+        if user_token_count > half_limit and system_token_count <= half_limit:
+            new_user_len = max_prompt_tokens - system_token_count
+            new_user_tokens = self._slice_tokens(user_tokens, new_user_len, truncation_type)
+            return [
+                {'role': 'developer', 'content': self.tokenizer.decode(system_tokens)},
+                {'role': 'user', 'content': [{'type': 'text', 'text': self.tokenizer.decode(new_user_tokens)}]},
+            ]
+        if system_token_count > half_limit and user_token_count <= half_limit:
+            new_system_len = max_prompt_tokens - user_token_count
+            new_system_tokens = self._slice_tokens(system_tokens, new_system_len, truncation_type)
+            return [
+                {'role': 'developer', 'content': self.tokenizer.decode(new_system_tokens)},
+                {'role': 'user', 'content': [{'type': 'text', 'text': self.tokenizer.decode(user_tokens)}]},
+            ]
+        return None
+
+    def truncate(self, prompts: list[dict], truncation_percentage: float | None, truncation_type: str) -> list[dict]:
+        """Main truncation method"""
+        if not self._validate_truncation_prompts(prompts):
             return prompts
 
         if truncation_percentage is None:
@@ -177,23 +237,9 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         system_tokens = Symbol(system_prompt['content']).tokens
         user_tokens = []
 
-
-
-
-        elif isinstance(user_prompt['content'], list):
-            for content_item in user_prompt['content']:
-                # Image input format
-                if isinstance(content_item, dict):
-                    if content_item.get('type') == 'text':
-                        user_tokens.extend(Symbol(content_item['text']).tokens)
-                    else:
-                        # Image content; return original since not supported
-                        return prompts
-                else:
-                    CustomUserWarning(f"Invalid content type: {type(content_item)}. Format input according to the documentation. See https://platform.openai.com/docs/api-reference/chat/create?lang=python", raise_with=ValueError)
-        else:
-            # Unknown input format
-            CustomUserWarning(f"Unknown content type: {type(user_prompt['content'])}. Format input according to the documentation. See https://platform.openai.com/docs/api-reference/chat/create?lang=python", raise_with=ValueError)
+        user_tokens, should_return_original = self._collect_user_tokens(user_prompt)
+        if should_return_original:
+            return prompts
 
         system_token_count = len(system_tokens)
         user_token_count = len(user_tokens)
@@ -208,7 +254,7 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         if total_tokens <= max_prompt_tokens:
             return prompts
 
-
+        UserMessage(
             f"Executing {truncation_type} truncation to fit within {max_prompt_tokens} tokens. "
             f"Combined prompts ({total_tokens} tokens) exceed maximum allowed tokens "
            f"of {max_prompt_tokens} ({truncation_percentage*100:.1f}% of context). "
@@ -218,23 +264,16 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
             f"Choose 'truncation_type' as 'head' to keep the end of prompts or 'tail' to keep the beginning."
         )
 
-
-
-
-
-
-
-
-
-
-
-        if system_token_count > max_prompt_tokens/2 and user_token_count <= max_prompt_tokens/2:
-            new_system_len = max_prompt_tokens - user_token_count
-            new_system_tokens = _slice_tokens(system_tokens, new_system_len, truncation_type)
-            return [
-                {'role': 'developer', 'content': self.tokenizer.decode(new_system_tokens)},
-                {'role': 'user', 'content': [{'type': 'text', 'text': self.tokenizer.decode(user_tokens)}]}
-            ]
+        single_prompt_adjustment = self._truncate_single_prompt_exceed(
+            system_tokens,
+            user_tokens,
+            system_token_count,
+            user_token_count,
+            max_prompt_tokens,
+            truncation_type,
+        )
+        if single_prompt_adjustment is not None:
+            return single_prompt_adjustment
 
         # Case 3: Both exceed - reduce proportionally
         system_ratio = system_token_count / total_tokens
@@ -246,8 +285,8 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         new_system_len += distribute_tokens // 2
         new_user_len += distribute_tokens // 2
 
-        new_system_tokens = _slice_tokens(system_tokens, new_system_len, truncation_type)
-        new_user_tokens = _slice_tokens(user_tokens, new_user_len, truncation_type)
+        new_system_tokens = self._slice_tokens(system_tokens, new_system_len, truncation_type)
+        new_user_tokens = self._slice_tokens(user_tokens, new_user_len, truncation_type)
 
         return [
             {'role': 'developer', 'content': self.tokenizer.decode(new_system_tokens)},
```
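The truncation refactor moves the slicing rule into `_slice_tokens`: 'head' truncation keeps the end of the token list, 'tail' keeps the beginning, and the result never drops below 100 tokens. A standalone mirror of that rule, useful for checking the semantics with plain token-id lists:

```python
def slice_tokens(tokens: list[int], new_len: int, truncation_type: str) -> list[int]:
    """Mirror of the engine's _slice_tokens: keep the tail for 'head' truncation,
    the head for 'tail' truncation, never fewer than 100 tokens."""
    new_len = max(100, new_len)
    return tokens[-new_len:] if truncation_type == 'head' else tokens[:new_len]


tokens = list(range(500))
assert slice_tokens(tokens, 120, 'head') == tokens[-120:]   # drop the beginning
assert slice_tokens(tokens, 120, 'tail') == tokens[:120]    # drop the end
assert len(slice_tokens(tokens, 10, 'tail')) == 100         # floor of 100 tokens
```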
```diff
@@ -268,18 +307,18 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         except Exception as e:
             if openai.api_key is None or openai.api_key == '':
                 msg = 'OpenAI API key is not set. Please set it in the config file or pass it as an argument to the command method.'
-
+                UserMessage(msg)
                 if self.config['NEUROSYMBOLIC_ENGINE_API_KEY'] is None or self.config['NEUROSYMBOLIC_ENGINE_API_KEY'] == '':
-
+                    UserMessage(msg, raise_with=ValueError)
                 openai.api_key = self.config['NEUROSYMBOLIC_ENGINE_API_KEY']
 
             callback = self.client.chat.completions.create
-            kwargs['model'] = kwargs
+            kwargs['model'] = kwargs.get('model', self.model)
 
             if except_remedy is not None:
                 res = except_remedy(self, e, callback, argument)
             else:
-
+                UserMessage(f'Error during generation. Caused by: {e}', raise_with=ValueError)
 
         metadata = {'raw_output': res}
         if payload.get('tools'):
```
```diff
@@ -290,95 +329,173 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
 
     def _prepare_raw_input(self, argument):
         if not argument.prop.processed_input:
-
+            UserMessage('Need to provide a prompt instruction to the engine if raw_input is enabled.', raise_with=ValueError)
         value = argument.prop.processed_input
         # convert to dict if not already
-        if
-            if
+        if not isinstance(value, list):
+            if not isinstance(value, dict):
                 value = {'role': 'user', 'content': str(value)}
             value = [value]
         return value
 
-    def
-        if
-            argument.prop.prepared_input = self._prepare_raw_input(argument)
-            return
-
-        _non_verbose_output = """<META_INSTRUCTION/>\nYou do not output anything else, like verbose preambles or post explanation, such as "Sure, let me...", "Hope that was helpful...", "Yes, I can help you with that...", etc. Consider well formatted output, e.g. for sentences use punctuation, spaces etc. or for code use indentation, etc. Never add meta instructions information to your output!\n\n"""
-        user: str = ""
-        developer: str = ""
-
+    def _non_verbose_section(self, argument) -> str:
+        """Return non-verbose instruction section if needed."""
         if argument.prop.suppress_verbose_output:
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+            return (
+                "<META_INSTRUCTION/>\n"
+                "You do not output anything else, like verbose preambles or post explanation, such as "
+                "\"Sure, let me...\", \"Hope that was helpful...\", \"Yes, I can help you with that...\", etc. "
+                "Consider well formatted output, e.g. for sentences use punctuation, spaces etc. or for code use "
+                "indentation, etc. Never add meta instructions information to your output!\n\n"
+            )
+        return ''
+
+    def _response_format_section(self, argument) -> str:
+        """Return response format instructions if provided."""
+        if not argument.prop.response_format:
+            return ''
+        response_format = argument.prop.response_format
+        assert response_format.get('type') is not None, 'Expected format `{ "type": "json_object" }`! See https://platform.openai.com/docs/api-reference/chat/create#chat-create-response_format'
+        if response_format["type"] == "json_object":
+            return '<RESPONSE_FORMAT/>\nYou are a helpful assistant designed to output JSON.\n\n'
+        return ''
+
+    def _context_sections(self, argument) -> list[str]:
+        """Return static and dynamic context sections."""
+        sections: list[str] = []
+        static_ctxt, dyn_ctxt = argument.prop.instance.global_context
         if len(static_ctxt) > 0:
-
-
+            sections.append(f"<STATIC CONTEXT/>\n{static_ctxt}\n\n")
         if len(dyn_ctxt) > 0:
-
+            sections.append(f"<DYNAMIC CONTEXT/>\n{dyn_ctxt}\n\n")
+        return sections
 
-
+    def _additional_context_section(self, argument) -> str:
+        """Return additional payload context if any."""
         if argument.prop.payload:
-
+            return f"<ADDITIONAL CONTEXT/>\n{argument.prop.payload!s}\n\n"
+        return ''
 
+    def _examples_section(self, argument) -> str:
+        """Return examples section if provided."""
         examples: list[str] = argument.prop.examples
         if examples and len(examples) > 0:
-
-
-
+            return f"<EXAMPLES/>\n{examples!s}\n\n"
+        return ''
+
+    def _instruction_section(self, argument, image_files: list[str]) -> str:
+        """Return instruction section, removing vision patterns when needed."""
+        prompt = argument.prop.prompt
+        if prompt is None or len(prompt) == 0:
+            return ''
+        value = str(prompt)
+        if len(image_files) > 0:
+            value = self._remove_vision_pattern(value)
+        return f"<INSTRUCTION/>\n{value}\n\n"
+
+    def _build_developer_prompt(self, argument, image_files: list[str]) -> str:
+        """Assemble developer prompt content."""
+        developer = self._non_verbose_section(argument)
+        developer = f'{developer}\n' if developer else ''
+
+        parts = [
+            self._response_format_section(argument),
+            *self._context_sections(argument),
+            self._additional_context_section(argument),
+            self._examples_section(argument),
+            self._instruction_section(argument, image_files),
+        ]
+        developer += ''.join(part for part in parts if part)
 
-        if argument.prop.
-
-
-
-
+        if argument.prop.template_suffix:
+            developer += (
+                f' You will only generate content for the placeholder `{argument.prop.template_suffix!s}` '
+                'following the instructions and the provided context information.\n\n'
+            )
+        return developer
 
+    def _build_user_suffix(self, argument, image_files: list[str]) -> str:
+        """Prepare user content suffix."""
         suffix: str = str(argument.prop.processed_input)
         if len(image_files) > 0:
             suffix = self._remove_vision_pattern(suffix)
+        return suffix
 
-
+    def _construct_user_prompt(self, user_text: str, image_files: list[str]):
+        """Construct user prompt payload."""
+        if self.model in {
+            'o1',
+            'o3',
+            'o3-mini',
+            'o4-mini',
+            'gpt-5',
+            'gpt-5-mini',
+            'gpt-5-nano',
+        }:
+            images = [{'type': 'image_url', 'image_url': {'url': file}} for file in image_files]
+            user_prompt = {
+                "role": "user",
+                "content": [
+                    *images,
+                    {'type': 'text', 'text': user_text},
+                ],
+            }
+            return user_prompt, images
+        return {"role": "user", "content": user_text}, None
+
+    def _apply_self_prompt(
+        self,
+        argument,
+        user_prompt,
+        developer: str,
+        user_text: str,
+        images,
+        image_files: list[str],
+    ):
+        """Apply self-prompting when requested."""
+        instance = argument.prop.instance
+        if not (instance._kwargs.get('self_prompt', False) or argument.prop.self_prompt):
+            return user_prompt, developer
+
+        self_prompter = SelfPrompt()
+        res = self_prompter({'user': user_text, 'developer': developer})
+        if res is None:
+            UserMessage("Self-prompting failed!", raise_with=ValueError)
 
-        if
-
-
-
-
-
-
-
+        if len(image_files) > 0:
+            image_content = images if images is not None else [
+                {'type': 'image_url', 'image_url': {'url': file}} for file in image_files
+            ]
+            user_prompt = {
+                "role": "user",
+                "content": [
+                    *image_content,
+                    {'type': 'text', 'text': res['user']},
+                ],
+            }
         else:
-            user_prompt = {
+            user_prompt = {"role": "user", "content": res['user']}
 
-
-        if argument.prop.instance._kwargs.get('self_prompt', False) or argument.prop.self_prompt:
-            self_prompter = SelfPrompt()
-            res = self_prompter({'user': user, 'developer': developer})
-            if res is None:
-                CustomUserWarning("Self-prompting failed!", raise_with=ValueError)
+        return user_prompt, res['developer']
 
-
-
-
-
-
-
-            user_prompt = { "role": "user", "content": res['user'] }
+    def prepare(self, argument):
+        if argument.prop.raw_input:
+            argument.prop.prepared_input = self._prepare_raw_input(argument)
+            return
+
+        image_files = self._handle_image_content(str(argument.prop.processed_input))
 
-
+        developer = self._build_developer_prompt(argument, image_files)
+        user_text = self._build_user_suffix(argument, image_files)
+        user_prompt, images = self._construct_user_prompt(user_text, image_files)
+        user_prompt, developer = self._apply_self_prompt(
+            argument,
+            user_prompt,
+            developer,
+            user_text,
+            images,
+            image_files,
+        )
 
         argument.prop.prepared_input = [
             { "role": "developer", "content": developer },
```
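The rewritten `prepare` assembles the developer prompt from optional sections and keeps only the non-empty ones via `''.join(part for part in parts if part)`. A minimal sketch of that composition pattern, with hypothetical section contents for illustration only:

```python
def build_developer_prompt(sections: list[str]) -> str:
    """Join only the non-empty sections, matching the
    ''.join(part for part in parts if part) pattern used in the diff."""
    return ''.join(part for part in sections if part)


# Hypothetical section contents; the engine derives these from argument.prop.
parts = [
    '',                                                       # no <RESPONSE_FORMAT/> requested
    '<STATIC CONTEXT/>\nYou are a geometry tutor.\n\n',
    '',                                                       # no <ADDITIONAL CONTEXT/>
    '<EXAMPLES/>\n["area of a 2x3 rectangle -> 6"]\n\n',
    '<INSTRUCTION/>\nCompute the area of a 5x4 rectangle.\n\n',
]
developer = build_developer_prompt(parts)
# developer now contains only the three populated sections, in order.
```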
```diff
@@ -387,24 +504,28 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
 
     def _process_function_calls(self, res, metadata):
         hit = False
-        if
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+        if (
+            hasattr(res, 'choices')
+            and res.choices
+            and hasattr(res.choices[0], 'message')
+            and res.choices[0].message
+            and hasattr(res.choices[0].message, 'tool_calls')
+            and res.choices[0].message.tool_calls
+        ):
+            for tool_call in res.choices[0].message.tool_calls:
+                if hit:
+                    UserMessage("Multiple function calls detected in the response but only the first one will be processed.")
+                    break
+                if hasattr(tool_call, 'function') and tool_call.function:
+                    try:
+                        args_dict = json.loads(tool_call.function.arguments)
+                    except json.JSONDecodeError:
+                        args_dict = {}
+                    metadata['function_call'] = {
+                        'name': tool_call.function.name,
+                        'arguments': args_dict
+                    }
+                    hit = True
         return metadata
 
     def _prepare_request_payload(self, messages, argument):
```
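`_process_function_calls` now guards every attribute access before reading tool calls and falls back to an empty dict when the call arguments are not valid JSON. A self-contained sketch of the same extraction against a mocked response object (the real objects come from the openai SDK):

```python
import json
from types import SimpleNamespace


def first_function_call(res) -> dict | None:
    """Extract name/arguments of the first tool call, tolerating malformed JSON."""
    choices = getattr(res, 'choices', None)
    if not choices:
        return None
    message = getattr(choices[0], 'message', None)
    tool_calls = getattr(message, 'tool_calls', None) if message else None
    if not tool_calls:
        return None
    fn = tool_calls[0].function
    try:
        args = json.loads(fn.arguments)
    except json.JSONDecodeError:
        args = {}
    return {'name': fn.name, 'arguments': args}


# Mocked response shaped like an OpenAI chat completion carrying one tool call.
res = SimpleNamespace(choices=[SimpleNamespace(message=SimpleNamespace(
    tool_calls=[SimpleNamespace(function=SimpleNamespace(name='get_weather', arguments='{"city": "Vienna"}'))]))])
assert first_function_call(res) == {'name': 'get_weather', 'arguments': {'city': 'Vienna'}}
```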
```diff
@@ -416,13 +537,13 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
         remaining_tokens = self.compute_remaining_tokens(messages)
 
         if max_tokens is not None:
-
+            UserMessage(
                 "'max_tokens' is now deprecated in favor of 'max_completion_tokens', and is not compatible with o1 series models. "
                 "We handle this conversion by default for you for now but we won't in the future. "
                 "See: https://platform.openai.com/docs/api-reference/chat/create"
             )
             if max_tokens > self.max_response_tokens:
-
+                UserMessage(
                     f"Provided 'max_tokens' ({max_tokens}) exceeds max response tokens ({self.max_response_tokens}). "
                     f"Truncating to {remaining_tokens} to avoid API failure."
                 )
@@ -431,13 +552,12 @@ class GPTXReasoningEngine(Engine, OpenAIMixin):
             kwargs['max_completion_tokens'] = max_tokens
             del kwargs['max_tokens']
 
-        if max_completion_tokens is not None:
-
-
-
-
-
-            kwargs['max_completion_tokens'] = remaining_tokens
+        if max_completion_tokens is not None and max_completion_tokens > self.max_response_tokens:
+            UserMessage(
+                f"Provided 'max_completion_tokens' ({max_completion_tokens}) exceeds max response tokens ({self.max_response_tokens}). "
+                f"Truncating to {remaining_tokens} to avoid API failure."
+            )
+            kwargs['max_completion_tokens'] = remaining_tokens
 
         payload = {
             "messages": messages,
```
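`_prepare_request_payload` converts the deprecated `max_tokens` into `max_completion_tokens` and replaces limits above the model's response maximum with the computed remaining budget. The lines between the two hunks are not shown, so the clamp on `max_tokens` below is an assumption; a rough sketch of the conversion over a plain kwargs dict:

```python
def normalize_completion_limit(kwargs: dict, max_response_tokens: int, remaining_tokens: int) -> dict:
    """Sketch of the conversion shown in the diff: move the deprecated
    'max_tokens' to 'max_completion_tokens' and fall back to the computed
    remaining budget whenever a requested limit exceeds the model maximum."""
    max_tokens = kwargs.pop('max_tokens', None)
    if max_tokens is not None:
        if max_tokens > max_response_tokens:
            max_tokens = remaining_tokens  # assumed clamping step between the two hunks
        kwargs['max_completion_tokens'] = max_tokens
    mct = kwargs.get('max_completion_tokens')
    if mct is not None and mct > max_response_tokens:
        kwargs['max_completion_tokens'] = remaining_tokens
    return kwargs


assert normalize_completion_limit({'max_tokens': 1000}, 800, 700) == {'max_completion_tokens': 700}
assert normalize_completion_limit({'max_completion_tokens': 300}, 800, 700) == {'max_completion_tokens': 300}
```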
symai/backend/engines/ocr/engine_apilayer.py

```diff
@@ -1,11 +1,10 @@
-import requests
 from pathlib import Path
 
-
+import requests
 
+from ....symbol import Result
 from ...base import Engine
 from ...settings import SYMAI_CONFIG
-from ....symbol import Result
 
 
 class ApiLayerResult(Result):
@@ -14,13 +13,13 @@ class ApiLayerResult(Result):
         self.raw = text
         try:
             dict_ = self._to_symbol(text).ast()
-            self._value = dict_
-        except:
+            self._value = dict_.get('all_text', f'OCR Engine Error: {text} - status code {status_code}')
+        except Exception:
             self._value = f'OCR Engine Error: {text} - status code {status_code}'
 
 
 class OCREngine(Engine):
-    def __init__(self, api_key:
+    def __init__(self, api_key: str | None = None):
         super().__init__()
         # Opening JSON file
         self.config = SYMAI_CONFIG
@@ -42,12 +41,11 @@ class OCREngine(Engine):
         }
 
     def forward(self, argument):
-        kwargs = argument.kwargs
         image_url = argument.prop.image
 
         if image_url.startswith("file://"):
             file_path = Path(image_url[7:]).resolve()
-            with open(
+            with file_path.open("rb") as file:
                 payload = file.read()
             url = "https://api.apilayer.com/image_to_text/upload"
             response = requests.request("POST", url, headers=self.headers, data=payload)
```
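`ApiLayerResult` now pulls the `all_text` field out of the parsed OCR response and falls back to an error string when parsing fails or the field is missing. A sketch of that fallback using plain `json.loads` in place of the engine's `_to_symbol(...).ast()` parsing:

```python
import json


def ocr_value(text: str, status_code: int) -> str:
    """Mirror the fallback: return the 'all_text' field from the JSON body,
    or an error string when parsing fails or the key is absent."""
    error = f'OCR Engine Error: {text} - status code {status_code}'
    try:
        return json.loads(text).get('all_text', error)
    except Exception:
        return error


assert ocr_value('{"all_text": "Hello"}', 200) == 'Hello'
assert ocr_value('not json', 500) == 'OCR Engine Error: not json - status code 500'
```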
symai/backend/engines/output/engine_stdout.py

```diff
@@ -15,10 +15,7 @@ class OutputEngine(Engine):
         args = [] if args is None else args
         kwargs = {} if kwargs is None else kwargs
         if expr:
-            if processed
-                res = expr(processed, *args, **kwargs)
-            else:
-                res = expr(*args, **kwargs)
+            res = expr(processed, *args, **kwargs) if processed else expr(*args, **kwargs)
 
         metadata = {}
         result = {
```
|