symbolicai 0.21.0__py3-none-any.whl → 1.1.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- symai/__init__.py +269 -173
- symai/backend/base.py +123 -110
- symai/backend/engines/drawing/engine_bfl.py +45 -44
- symai/backend/engines/drawing/engine_gpt_image.py +112 -97
- symai/backend/engines/embedding/engine_llama_cpp.py +63 -52
- symai/backend/engines/embedding/engine_openai.py +25 -21
- symai/backend/engines/execute/engine_python.py +19 -18
- symai/backend/engines/files/engine_io.py +104 -95
- symai/backend/engines/imagecaptioning/engine_blip2.py +28 -24
- symai/backend/engines/imagecaptioning/engine_llavacpp_client.py +102 -79
- symai/backend/engines/index/engine_pinecone.py +124 -97
- symai/backend/engines/index/engine_qdrant.py +1011 -0
- symai/backend/engines/index/engine_vectordb.py +84 -56
- symai/backend/engines/lean/engine_lean4.py +96 -52
- symai/backend/engines/neurosymbolic/__init__.py +41 -13
- symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_chat.py +330 -248
- symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_reasoning.py +329 -264
- symai/backend/engines/neurosymbolic/engine_cerebras.py +328 -0
- symai/backend/engines/neurosymbolic/engine_deepseekX_reasoning.py +118 -88
- symai/backend/engines/neurosymbolic/engine_google_geminiX_reasoning.py +344 -299
- symai/backend/engines/neurosymbolic/engine_groq.py +173 -115
- symai/backend/engines/neurosymbolic/engine_huggingface.py +114 -84
- symai/backend/engines/neurosymbolic/engine_llama_cpp.py +144 -118
- symai/backend/engines/neurosymbolic/engine_openai_gptX_chat.py +415 -307
- symai/backend/engines/neurosymbolic/engine_openai_gptX_reasoning.py +394 -231
- symai/backend/engines/ocr/engine_apilayer.py +23 -27
- symai/backend/engines/output/engine_stdout.py +10 -13
- symai/backend/engines/{webscraping → scrape}/engine_requests.py +101 -54
- symai/backend/engines/search/engine_openai.py +100 -88
- symai/backend/engines/search/engine_parallel.py +665 -0
- symai/backend/engines/search/engine_perplexity.py +44 -45
- symai/backend/engines/search/engine_serpapi.py +37 -34
- symai/backend/engines/speech_to_text/engine_local_whisper.py +54 -51
- symai/backend/engines/symbolic/engine_wolframalpha.py +15 -9
- symai/backend/engines/text_to_speech/engine_openai.py +20 -26
- symai/backend/engines/text_vision/engine_clip.py +39 -37
- symai/backend/engines/userinput/engine_console.py +5 -6
- symai/backend/mixin/__init__.py +13 -0
- symai/backend/mixin/anthropic.py +48 -38
- symai/backend/mixin/deepseek.py +6 -5
- symai/backend/mixin/google.py +7 -4
- symai/backend/mixin/groq.py +2 -4
- symai/backend/mixin/openai.py +140 -110
- symai/backend/settings.py +87 -20
- symai/chat.py +216 -123
- symai/collect/__init__.py +7 -1
- symai/collect/dynamic.py +80 -70
- symai/collect/pipeline.py +67 -51
- symai/collect/stats.py +161 -109
- symai/components.py +707 -360
- symai/constraints.py +24 -12
- symai/core.py +1857 -1233
- symai/core_ext.py +83 -80
- symai/endpoints/api.py +166 -104
- symai/extended/.DS_Store +0 -0
- symai/extended/__init__.py +46 -12
- symai/extended/api_builder.py +29 -21
- symai/extended/arxiv_pdf_parser.py +23 -14
- symai/extended/bibtex_parser.py +9 -6
- symai/extended/conversation.py +156 -126
- symai/extended/document.py +50 -30
- symai/extended/file_merger.py +57 -14
- symai/extended/graph.py +51 -32
- symai/extended/html_style_template.py +18 -14
- symai/extended/interfaces/blip_2.py +2 -3
- symai/extended/interfaces/clip.py +4 -3
- symai/extended/interfaces/console.py +9 -1
- symai/extended/interfaces/dall_e.py +4 -2
- symai/extended/interfaces/file.py +2 -0
- symai/extended/interfaces/flux.py +4 -2
- symai/extended/interfaces/gpt_image.py +16 -7
- symai/extended/interfaces/input.py +2 -1
- symai/extended/interfaces/llava.py +1 -2
- symai/extended/interfaces/{naive_webscraping.py → naive_scrape.py} +4 -3
- symai/extended/interfaces/naive_vectordb.py +9 -10
- symai/extended/interfaces/ocr.py +5 -3
- symai/extended/interfaces/openai_search.py +2 -0
- symai/extended/interfaces/parallel.py +30 -0
- symai/extended/interfaces/perplexity.py +2 -0
- symai/extended/interfaces/pinecone.py +12 -9
- symai/extended/interfaces/python.py +2 -0
- symai/extended/interfaces/serpapi.py +3 -1
- symai/extended/interfaces/terminal.py +2 -4
- symai/extended/interfaces/tts.py +3 -2
- symai/extended/interfaces/whisper.py +3 -2
- symai/extended/interfaces/wolframalpha.py +2 -1
- symai/extended/metrics/__init__.py +11 -1
- symai/extended/metrics/similarity.py +14 -13
- symai/extended/os_command.py +39 -29
- symai/extended/packages/__init__.py +29 -3
- symai/extended/packages/symdev.py +51 -43
- symai/extended/packages/sympkg.py +41 -35
- symai/extended/packages/symrun.py +63 -50
- symai/extended/repo_cloner.py +14 -12
- symai/extended/seo_query_optimizer.py +15 -13
- symai/extended/solver.py +116 -91
- symai/extended/summarizer.py +12 -10
- symai/extended/taypan_interpreter.py +17 -18
- symai/extended/vectordb.py +122 -92
- symai/formatter/__init__.py +9 -1
- symai/formatter/formatter.py +51 -47
- symai/formatter/regex.py +70 -69
- symai/functional.py +325 -176
- symai/imports.py +190 -147
- symai/interfaces.py +57 -28
- symai/memory.py +45 -35
- symai/menu/screen.py +28 -19
- symai/misc/console.py +66 -56
- symai/misc/loader.py +8 -5
- symai/models/__init__.py +17 -1
- symai/models/base.py +395 -236
- symai/models/errors.py +1 -2
- symai/ops/__init__.py +32 -22
- symai/ops/measures.py +24 -25
- symai/ops/primitives.py +1149 -731
- symai/post_processors.py +58 -50
- symai/pre_processors.py +86 -82
- symai/processor.py +21 -13
- symai/prompts.py +764 -685
- symai/server/huggingface_server.py +135 -49
- symai/server/llama_cpp_server.py +21 -11
- symai/server/qdrant_server.py +206 -0
- symai/shell.py +100 -42
- symai/shellsv.py +700 -492
- symai/strategy.py +630 -346
- symai/symbol.py +368 -322
- symai/utils.py +100 -78
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/METADATA +22 -10
- symbolicai-1.1.0.dist-info/RECORD +168 -0
- symbolicai-0.21.0.dist-info/RECORD +0 -162
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/WHEEL +0 -0
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/entry_points.txt +0 -0
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/licenses/LICENSE +0 -0
- {symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/top_level.txt +0 -0
symai/backend/engines/neurosymbolic/engine_google_geminiX_reasoning.py

@@ -1,9 +1,7 @@
 import base64
-import io
 import logging
 import mimetypes
 import re
-import urllib.parse
 from copy import deepcopy
 from pathlib import Path
 
@@ -12,9 +10,7 @@ from google import genai
 from google.genai import types
 
 from ....components import SelfPrompt
-from ....
-from ....symbol import Symbol
-from ....utils import CustomUserWarning, encode_media_frames
+from ....utils import UserMessage, encode_media_frames
 from ...base import Engine
 from ...mixin.google import GoogleMixin
 from ...settings import SYMAI_CONFIG
@@ -34,19 +30,20 @@ class TokenizerWrapper:
     def encode(self, text: str) -> int:
         return self.compute_tokens_func([{"role": "user", "content": text}])
 
+
 class GeminiXReasoningEngine(Engine, GoogleMixin):
     def __init__(self, api_key: str | None = None, model: str | None = None):
         super().__init__()
         self.config = deepcopy(SYMAI_CONFIG)
         # In case we use EngineRepository.register to inject the api_key and model => dynamically change the engine at runtime
         if api_key is not None and model is not None:
-            self.config['NEUROSYMBOLIC_ENGINE_API_KEY'] = api_key
-            self.config['NEUROSYMBOLIC_ENGINE_MODEL'] = model
-        if self.id() != 'neurosymbolic':
-            return
+            self.config["NEUROSYMBOLIC_ENGINE_API_KEY"] = api_key
+            self.config["NEUROSYMBOLIC_ENGINE_MODEL"] = model
+        if self.id() != "neurosymbolic":
+            return # do not initialize if not neurosymbolic; avoids conflict with llama.cpp check in EngineRepository.register_from_package
 
-        self.api_key = self.config['NEUROSYMBOLIC_ENGINE_API_KEY']
-        self.model = self.config['NEUROSYMBOLIC_ENGINE_MODEL']
+        self.api_key = self.config["NEUROSYMBOLIC_ENGINE_API_KEY"]
+        self.model = self.config["NEUROSYMBOLIC_ENGINE_MODEL"]
         self.name = self.__class__.__name__
         self.tokenizer = TokenizerWrapper(self.compute_required_tokens)
         self.max_context_tokens = self.api_max_context_tokens()
@@ -54,33 +51,32 @@ class GeminiXReasoningEngine(Engine, GoogleMixin):
         self.client = genai.Client(api_key=self.api_key)
 
     def id(self) -> str:
-        model = self.config.get('NEUROSYMBOLIC_ENGINE_MODEL')
-        if model and model.startswith('gemini'):
-            return 'neurosymbolic'
-        return super().id()
+        model = self.config.get("NEUROSYMBOLIC_ENGINE_MODEL")
+        if model and model.startswith("gemini"):
+            return "neurosymbolic"
+        return super().id() # default to unregistered
 
     def command(self, *args, **kwargs):
         super().command(*args, **kwargs)
-        if 'NEUROSYMBOLIC_ENGINE_API_KEY' in kwargs:
-            self.api_key = kwargs['NEUROSYMBOLIC_ENGINE_API_KEY']
+        if "NEUROSYMBOLIC_ENGINE_API_KEY" in kwargs:
+            self.api_key = kwargs["NEUROSYMBOLIC_ENGINE_API_KEY"]
             genai.configure(api_key=self.api_key)
-        if 'NEUROSYMBOLIC_ENGINE_MODEL' in kwargs:
-            self.model = kwargs['NEUROSYMBOLIC_ENGINE_MODEL']
+        if "NEUROSYMBOLIC_ENGINE_MODEL" in kwargs:
+            self.model = kwargs["NEUROSYMBOLIC_ENGINE_MODEL"]
             self.client = genai.GenerativeModel(model_name=self.model)
 
     def compute_required_tokens(self, messages) -> int:
         api_contents: list[types.Content] = []
 
         for msg in messages:
-            if
-
-            for part in msg:
+            msg_parts = msg if isinstance(msg, list) else [msg]
+            for part in msg_parts:
                 if isinstance(part, str):
-                    role = 'user'
+                    role = "user"
                     content_str = part
                 elif isinstance(part, dict):
-                    role = part.get('role')
-                    content_str = str(part.get('content', ''))
+                    role = part.get("role")
+                    content_str = str(part.get("content", ""))
                 current_message_api_parts: list[types.Part] = []
                 image_api_parts = self._handle_image_content(content_str)
                 current_message_api_parts.extend(image_api_parts)
@@ -96,168 +92,180 @@ class GeminiXReasoningEngine(Engine, GoogleMixin):
             return 0
 
         try:
-            count_response = self.client.models.count_tokens(model=self.model, contents=api_contents)
+            count_response = self.client.models.count_tokens(
+                model=self.model, contents=api_contents
+            )
             return count_response.total_tokens
         except Exception as e:
-
-
+            UserMessage(f"Gemini count_tokens failed: {e}")
+            UserMessage(f"Error counting tokens for Gemini: {e!s}", raise_with=RuntimeError)
 
-    def compute_remaining_tokens(self,
-
+    def compute_remaining_tokens(self, _prompts: list) -> int:
+        UserMessage("Token counting not implemented for Gemini", raise_with=NotImplementedError)
 
     def _handle_document_content(self, content: str):
         """Handle document content by uploading to Gemini"""
         try:
-            pattern = r'<<document:(.*?):>>'
+            pattern = r"<<document:(.*?):>>"
            matches = re.findall(pattern, content)
             if not matches:
                 return None
 
             doc_path = matches[0].strip()
-            if doc_path.startswith('http'):
-
+            if doc_path.startswith("http"):
+                UserMessage("URL documents not yet supported for Gemini")
                 return None
-
-            uploaded_file = genai.upload_file(doc_path)
-            return uploaded_file
+            return genai.upload_file(doc_path)
         except Exception as e:
-
+            UserMessage(f"Failed to process document: {e}")
             return None
 
-    def _handle_image_content(self, content: str) -> list:
+    def _handle_image_content(self, content: str) -> list[types.Part]:
         """Handle image content by processing and preparing google.generativeai.types.Part objects."""
-        image_parts = []
-
-        matches = re.findall(pattern, content) # re must be imported
-
-        for match in matches:
-            img_src = match.strip()
-
+        image_parts: list[types.Part] = []
+        for img_src in self._extract_image_sources(content):
             try:
-
-                    header, encoded = img_src.split(',', 1)
-                    mime_type = header.split(';')[0].split(':')[1]
-                    image_bytes = base64.b64decode(encoded)
-                    image_parts.append(genai.types.Part(inline_data=genai.types.Blob(mime_type=mime_type, data=image_bytes)))
-
-                elif img_src.startswith('http://') or img_src.startswith('https://'):
-                    response = requests.get(img_src, timeout=10) # 10 seconds timeout
-                    response.raise_for_status()
-
-                    image_bytes = response.content
-                    mime_type = response.headers.get('Content-Type', 'application/octet-stream')
-
-                    if not mime_type.startswith('image/'):
-                        CustomUserWarning(f"URL content type '{mime_type}' does not appear to be an image for: {img_src}. Attempting to use anyway.")
-
-                    image_parts.append(genai.types.Part(inline_data=genai.types.Blob(mime_type=mime_type, data=image_bytes)))
-
-                elif img_src.startswith('frames:'):
-                    temp_path = img_src.replace('frames:', '')
-                    parts = temp_path.split(':', 1)
-                    if len(parts) != 2:
-                        CustomUserWarning(f"Invalid 'frames:' format: {img_src}")
-                        continue
-                    max_used_frames_str, actual_path = parts
-                    try:
-                        max_used_frames = int(max_used_frames_str)
-                    except ValueError:
-                        CustomUserWarning(f"Invalid max_frames number in 'frames:' format: {img_src}")
-                        continue
-
-                    frame_buffers, ext = encode_media_frames(actual_path)
-
-                    mime_type = f'image/{ext.lower()}' if ext else 'application/octet-stream'
-                    if ext and ext.lower() == 'jpg':
-                        mime_type = 'image/jpeg'
-
-                    if not frame_buffers:
-                        CustomUserWarning(f"encode_media_frames returned no frames for: {actual_path}")
-                        continue
-
-                    step = max(1, len(frame_buffers) // 50)
-                    indices = list(range(0, len(frame_buffers), step))[:max_used_frames]
-
-                    for i_idx in indices:
-                        if i_idx < len(frame_buffers):
-                            image_bytes = frame_buffers[i_idx]
-                            image_parts.append(genai.types.Part(inline_data=genai.types.Blob(mime_type=mime_type, data=image_bytes)))
-
-                else:
-                    # Handle local file paths
-                    local_file_path = Path(img_src)
-                    if not local_file_path.is_file():
-                        CustomUserWarning(f"Local image file not found: {img_src}")
-                        continue
-
-                    image_bytes = local_file_path.read_bytes()
-                    mime_type, _ = mimetypes.guess_type(local_file_path)
-                    if mime_type is None: # Fallback MIME type determination
-                        file_ext = local_file_path.suffix.lower().lstrip('.')
-                        if file_ext == 'jpg': mime_type = 'image/jpeg'
-                        elif file_ext == 'png': mime_type = 'image/png'
-                        elif file_ext == 'gif': mime_type = 'image/gif'
-                        elif file_ext == 'webp': mime_type = 'image/webp'
-                        else: mime_type = 'application/octet-stream'
-
-                    image_parts.append(genai.types.Part(inline_data=genai.types.Blob(mime_type=mime_type, data=image_bytes)))
-
+                image_parts.extend(self._create_parts_from_image_source(img_src))
             except Exception as e:
-
-
+                UserMessage(
+                    f"Failed to process image source '{img_src}'. Error: {e!s}",
+                    raise_with=ValueError,
+                )
         return image_parts
 
+    def _extract_image_sources(self, content: str) -> list[str]:
+        pattern = r"<<vision:(.*?):>>"
+        return [match.strip() for match in re.findall(pattern, content)]
+
+    def _create_parts_from_image_source(self, img_src: str) -> list[types.Part]:
+        if img_src.startswith("data:image"):
+            return self._create_parts_from_data_uri(img_src)
+        if img_src.startswith(("http://", "https://")):
+            return self._create_parts_from_url(img_src)
+        if img_src.startswith("frames:"):
+            return self._create_parts_from_frames(img_src)
+        return self._create_parts_from_local_path(img_src)
+
+    def _create_parts_from_data_uri(self, img_src: str) -> list[types.Part]:
+        header, encoded = img_src.split(",", 1)
+        mime_type = header.split(";")[0].split(":")[1]
+        image_bytes = base64.b64decode(encoded)
+        part = genai.types.Part(inline_data=genai.types.Blob(mime_type=mime_type, data=image_bytes))
+        return [part]
+
+    def _create_parts_from_url(self, img_src: str) -> list[types.Part]:
+        response = requests.get(img_src, timeout=10)
+        response.raise_for_status()
+        image_bytes = response.content
+        mime_type = response.headers.get("Content-Type", "application/octet-stream")
+        if not mime_type.startswith("image/"):
+            UserMessage(
+                f"URL content type '{mime_type}' does not appear to be an image for: {img_src}. Attempting to use anyway."
+            )
+        part = genai.types.Part(inline_data=genai.types.Blob(mime_type=mime_type, data=image_bytes))
+        return [part]
+
+    def _create_parts_from_frames(self, img_src: str) -> list[types.Part]:
+        temp_path = img_src.replace("frames:", "")
+        parts = temp_path.split(":", 1)
+        if len(parts) != 2:
+            UserMessage(f"Invalid 'frames:' format: {img_src}")
+            return []
+        max_used_frames_str, actual_path = parts
+        try:
+            max_used_frames = int(max_used_frames_str)
+        except ValueError:
+            UserMessage(f"Invalid max_frames number in 'frames:' format: {img_src}")
+            return []
+        frame_buffers, ext = encode_media_frames(actual_path)
+        mime_type = f"image/{ext.lower()}" if ext else "application/octet-stream"
+        if ext and ext.lower() == "jpg":
+            mime_type = "image/jpeg"
+        if not frame_buffers:
+            UserMessage(f"encode_media_frames returned no frames for: {actual_path}")
+            return []
+        step = max(1, len(frame_buffers) // 50)
+        indices = list(range(0, len(frame_buffers), step))[:max_used_frames]
+        parts_list: list[types.Part] = []
+        for frame_idx in indices:
+            if frame_idx < len(frame_buffers):
+                image_bytes = frame_buffers[frame_idx]
+                parts_list.append(
+                    genai.types.Part(
+                        inline_data=genai.types.Blob(mime_type=mime_type, data=image_bytes)
+                    )
+                )
+        return parts_list
+
+    def _create_parts_from_local_path(self, img_src: str) -> list[types.Part]:
+        local_file_path = Path(img_src)
+        if not local_file_path.is_file():
+            UserMessage(f"Local image file not found: {img_src}")
+            return []
+        image_bytes = local_file_path.read_bytes()
+        mime_type, _ = mimetypes.guess_type(local_file_path)
+        if mime_type is None:
+            file_ext = local_file_path.suffix.lower().lstrip(".")
+            if file_ext == "jpg":
+                mime_type = "image/jpeg"
+            elif file_ext == "png":
+                mime_type = "image/png"
+            elif file_ext == "gif":
+                mime_type = "image/gif"
+            elif file_ext == "webp":
+                mime_type = "image/webp"
+            else:
+                mime_type = "application/octet-stream"
+        part = genai.types.Part(inline_data=genai.types.Blob(mime_type=mime_type, data=image_bytes))
+        return [part]
+
     def _handle_video_content(self, content: str):
         """Handle video content by uploading to Gemini"""
         try:
-            pattern = r'<<video:(.*?):>>'
+            pattern = r"<<video:(.*?):>>"
             matches = re.findall(pattern, content)
             if not matches:
                 return None
 
             video_path = matches[0].strip()
-            if video_path.startswith('http'):
-
+            if video_path.startswith("http"):
+                UserMessage("URL videos not yet supported for Gemini")
                 return None
-
-
-            uploaded_file = genai.upload_file(video_path)
-            return uploaded_file
+            # Upload local video
+            return genai.upload_file(video_path)
         except Exception as e:
-
+            UserMessage(f"Failed to process video: {e}")
             return None
 
     def _handle_audio_content(self, content: str):
         """Handle audio content by uploading to Gemini"""
         try:
-            pattern = r'<<audio:(.*?):>>'
+            pattern = r"<<audio:(.*?):>>"
             matches = re.findall(pattern, content)
             if not matches:
                 return None
 
             audio_path = matches[0].strip()
-            if audio_path.startswith('http'):
-
+            if audio_path.startswith("http"):
+                UserMessage("URL audio not yet supported for Gemini")
                 return None
-
-
-            uploaded_file = genai.upload_file(audio_path)
-            return uploaded_file
+            # Upload local audio
+            return genai.upload_file(audio_path)
         except Exception as e:
-
+            UserMessage(f"Failed to process audio: {e}")
             return None
 
     def _remove_media_patterns(self, text: str) -> str:
         """Remove media pattern markers from text"""
         patterns = [
-            r'<<vision:(.*?):>>',
-            r'<<video:(.*?):>>',
-            r'<<audio:(.*?):>>',
-            r'<<document:(.*?):>>',
+            r"<<vision:(.*?):>>",
+            r"<<video:(.*?):>>",
+            r"<<audio:(.*?):>>",
+            r"<<document:(.*?):>>",
         ]
 
         for pattern in patterns:
-            text = re.sub(pattern, '', text)
+            text = re.sub(pattern, "", text)
 
         return text
 
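Note on the media markers matched throughout the hunk above: `<<vision:…:>>`, `<<document:…:>>`, `<<video:…:>>`, and `<<audio:…:>>` are symai's inline convention for attaching media to a prompt string. A minimal standalone sketch of what the new `_extract_image_sources` / `_remove_media_patterns` pair does with such a string (the paths are made up for illustration, not taken from the package):

import re

VISION_PATTERN = r"<<vision:(.*?):>>"  # same pattern as in the engine above

content = "Compare the plots <<vision:/tmp/a.png:>> <<vision:/tmp/b.png:>> briefly."

# What _extract_image_sources returns: the raw sources between the markers.
sources = [m.strip() for m in re.findall(VISION_PATTERN, content)]
assert sources == ["/tmp/a.png", "/tmp/b.png"]

# What _remove_media_patterns leaves behind: plain text for the text Part.
text_only = re.sub(VISION_PATTERN, "", content)
assert text_only == "Compare the plots   briefly."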
@@ -266,24 +274,24 @@ class GeminiXReasoningEngine(Engine, GoogleMixin):
         media_content = []
 
         # Process document content
-        if '<<document:' in processed_input_str:
+        if "<<document:" in processed_input_str:
             doc_file = self._handle_document_content(processed_input_str)
             if doc_file:
                 media_content.append(doc_file)
 
         # Process image content
-        if '<<vision:' in processed_input_str:
+        if "<<vision:" in processed_input_str:
             image_files = self._handle_image_content(processed_input_str)
             media_content.extend(image_files)
 
         # Process video content
-        if '<<video:' in processed_input_str:
+        if "<<video:" in processed_input_str:
             video_file = self._handle_video_content(processed_input_str)
             if video_file:
                 media_content.append(video_file)
 
         # Process audio content
-        if '<<audio:' in processed_input_str:
+        if "<<audio:" in processed_input_str:
             audio_file = self._handle_audio_content(processed_input_str)
             if audio_file:
                 media_content.append(audio_file)
@@ -295,277 +303,312 @@ class GeminiXReasoningEngine(Engine, GoogleMixin):
         thinking_content = ""
         text_content = ""
 
-        if hasattr(res, 'candidates') and res.candidates:
+        if hasattr(res, "candidates") and res.candidates:
             candidate = res.candidates[0]
-            if hasattr(candidate, 'content') and candidate.content:
+            if hasattr(candidate, "content") and candidate.content:
                 for part in candidate.content.parts:
-                    if hasattr(part, 'text') and part.text:
-                        if hasattr(part, 'thought') and part.thought:
+                    if hasattr(part, "text") and part.text:
+                        if hasattr(part, "thought") and part.thought:
                             thinking_content += part.text
                         else:
                             text_content += part.text
 
-        return {
-            "thinking": thinking_content,
-            "text": text_content
-        }
+        return {"thinking": thinking_content, "text": text_content}
 
     def forward(self, argument):
         kwargs = argument.kwargs
-
+        _system, prompt = argument.prop.prepared_input
         payload = self._prepare_request_payload(argument)
-        except_remedy = kwargs.get('except_remedy')
+        except_remedy = kwargs.get("except_remedy")
 
-        contents = []
-        for msg in prompt:
-            role = msg['role']
-            parts_list = msg['content']
-            contents.append(types.Content(role=role, parts=parts_list))
+        contents = self._build_contents_from_prompt(prompt)
 
         try:
-            generation_config = types.GenerateContentConfig(
-
-                temperature=payload.get('temperature', 1.0),
-                top_p=payload.get('top_p', 0.95),
-                top_k=payload.get('top_k', 40),
-                stop_sequences=payload.get('stop_sequences'),
-                response_mime_type=payload.get('response_mime_type', 'text/plain'),
-            )
-
-            if payload.get('system_instruction'):
-                generation_config.system_instruction = payload['system_instruction']
-
-            if payload.get('thinking_config'):
-                generation_config.thinking_config = payload['thinking_config']
-
-            if payload.get('tools'):
-                generation_config.tools = payload['tools']
-                generation_config.automatic_function_calling=payload['automatic_function_calling']
-
-            res = self.client.models.generate_content(
-                model=kwargs.get('model', self.model),
-                contents=contents,
-                config=generation_config
-            )
-
+            generation_config = self._build_generation_config(payload)
+            res = self._generate_model_response(kwargs, contents, generation_config)
         except Exception as e:
-
-            msg = 'Google API key is not set. Please set it in the config file or pass it as an argument to the command method.'
-            logging.error(msg)
-            if self.config['NEUROSYMBOLIC_ENGINE_API_KEY'] is None or self.config['NEUROSYMBOLIC_ENGINE_API_KEY'] == '':
-                CustomUserWarning(msg, raise_with=ValueError)
-            self.api_key = self.config['NEUROSYMBOLIC_ENGINE_API_KEY']
-            genai.configure(api_key=self.api_key)
-
-            if except_remedy is not None:
-                res = except_remedy(self, e, self.client.generate_content, argument)
-            else:
-                CustomUserWarning(f'Error during generation. Caused by: {e}', raise_with=ValueError)
+            res = self._handle_generation_error(e, except_remedy, argument)
 
-        metadata = {'raw_output': res}
-        if payload.get('tools'):
+        metadata = {"raw_output": res}
+        if payload.get("tools"):
             metadata = self._process_function_calls(res, metadata)
 
-        if kwargs.get('raw_output', False):
+        if kwargs.get("raw_output", False):
             return [res], metadata
 
         output = self._collect_response(res)
 
-        if output['thinking']:
-            metadata['thinking'] = output['thinking']
+        if output["thinking"]:
+            metadata["thinking"] = output["thinking"]
 
-        processed_text = output['text']
+        processed_text = output["text"]
         if argument.prop.response_format:
-
-            processed_text = processed_text.replace('```json', '').replace('```', '')
+            processed_text = processed_text.replace("```json", "").replace("```", "")
 
         return [processed_text], metadata
 
+    def _build_contents_from_prompt(self, prompt) -> list[types.Content]:
+        contents: list[types.Content] = []
+        for msg in prompt:
+            role = msg["role"]
+            parts_list = msg["content"]
+            contents.append(types.Content(role=role, parts=parts_list))
+        return contents
+
+    def _build_generation_config(self, payload: dict) -> types.GenerateContentConfig:
+        generation_config = types.GenerateContentConfig(
+            max_output_tokens=payload.get("max_output_tokens"),
+            temperature=payload.get("temperature", 1.0),
+            top_p=payload.get("top_p", 0.95),
+            top_k=payload.get("top_k", 40),
+            stop_sequences=payload.get("stop_sequences"),
+            response_mime_type=payload.get("response_mime_type", "text/plain"),
+        )
+        self._apply_optional_config_fields(generation_config, payload)
+        return generation_config
+
+    def _apply_optional_config_fields(
+        self, generation_config: types.GenerateContentConfig, payload: dict
+    ) -> None:
+        if payload.get("system_instruction"):
+            generation_config.system_instruction = payload["system_instruction"]
+        if payload.get("thinking_config"):
+            generation_config.thinking_config = payload["thinking_config"]
+        if payload.get("tools"):
+            generation_config.tools = payload["tools"]
+            generation_config.automatic_function_calling = payload["automatic_function_calling"]
+
+    def _generate_model_response(
+        self,
+        kwargs: dict,
+        contents: list[types.Content],
+        generation_config: types.GenerateContentConfig,
+    ):
+        return self.client.models.generate_content(
+            model=kwargs.get("model", self.model), contents=contents, config=generation_config
+        )
+
+    def _handle_generation_error(self, exception: Exception, except_remedy, argument):
+        if self.api_key is None or self.api_key == "":
+            msg = "Google API key is not set. Please set it in the config file or pass it as an argument to the command method."
+            UserMessage(msg)
+            if (
+                self.config["NEUROSYMBOLIC_ENGINE_API_KEY"] is None
+                or self.config["NEUROSYMBOLIC_ENGINE_API_KEY"] == ""
+            ):
+                UserMessage(msg, raise_with=ValueError)
+            self.api_key = self.config["NEUROSYMBOLIC_ENGINE_API_KEY"]
+            genai.configure(api_key=self.api_key)
+        if except_remedy is not None:
+            return except_remedy(self, exception, self.client.generate_content, argument)
+        UserMessage(f"Error during generation. Caused by: {exception}", raise_with=ValueError)
+        return None
+
     def _process_function_calls(self, res, metadata):
         hit = False
-        if hasattr(res, 'candidates') and res.candidates:
+        if hasattr(res, "candidates") and res.candidates:
             candidate = res.candidates[0]
-            if hasattr(candidate, 'content') and candidate.content:
+            if hasattr(candidate, "content") and candidate.content:
                 for part in candidate.content.parts:
-                    if hasattr(part, 'function_call') and part.function_call:
+                    if hasattr(part, "function_call") and part.function_call:
                         if hit:
-
+                            UserMessage(
+                                "Multiple function calls detected in the response but only the first one will be processed."
+                            )
                             break
                         func_call = part.function_call
-                        metadata['function_call'] = {
-
-
+                        metadata["function_call"] = {
+                            "name": func_call.name,
+                            "arguments": func_call.args,
                         }
                         hit = True
         return metadata
 
     def _prepare_raw_input(self, argument):
         if not argument.prop.processed_input:
-
+            UserMessage(
+                "Need to provide a prompt instruction to the engine if `raw_input` is enabled!",
+                raise_with=ValueError,
+            )
 
         raw_prompt_data = argument.prop.processed_input
-
-        system_instruction = None
+        normalized_prompts = self._normalize_raw_prompt_data(raw_prompt_data)
+        system_instruction, non_system_messages = self._separate_system_instruction(
+            normalized_prompts
+        )
+        messages_for_api = self._build_raw_input_messages(non_system_messages)
+        return system_instruction, messages_for_api
 
+    def _normalize_raw_prompt_data(self, raw_prompt_data):
         if isinstance(raw_prompt_data, str):
-
-
-
-
+            return [{"role": "user", "content": raw_prompt_data}]
+        if isinstance(raw_prompt_data, dict):
+            return [raw_prompt_data]
+        if isinstance(raw_prompt_data, list):
             for item in raw_prompt_data:
                 if not isinstance(item, dict):
-
-
-
-
-
-
+                    UserMessage(
+                        f"Invalid item in raw_input list: {item}. Expected dict.",
+                        raise_with=ValueError,
+                    )
+            return raw_prompt_data
+        UserMessage(
+            f"Unsupported type for raw_input: {type(raw_prompt_data)}. Expected str, dict, or list of dicts.",
+            raise_with=ValueError,
+        )
+        return []
+
+    def _separate_system_instruction(self, normalized_prompts):
+        system_instruction = None
+        non_system_messages = []
         for msg in normalized_prompts:
-            role = msg.get('role')
-            content = msg.get('content')
-
+            role = msg.get("role")
+            content = msg.get("content")
             if role is None or content is None:
-
+                UserMessage(
+                    f"Message in raw_input is missing 'role' or 'content': {msg}",
+                    raise_with=ValueError,
+                )
             if not isinstance(content, str):
-
-
+                UserMessage(
+                    f"Message content for role '{role}' in raw_input must be a string. Found type: {type(content)} for content: {content}",
+                    raise_with=ValueError,
+                )
+            if role == "system":
                 if system_instruction is not None:
-
+                    UserMessage(
+                        "Only one system instruction is allowed in raw_input mode!",
+                        raise_with=ValueError,
+                    )
                 system_instruction = content
             else:
-
-
-        for msg in temp_non_system_messages:
-            content_str = str(msg.get('content', ''))
+                non_system_messages.append({"role": role, "content": content})
+        return system_instruction, non_system_messages
 
+    def _build_raw_input_messages(self, messages):
+        messages_for_api = []
+        for msg in messages:
+            content_str = str(msg.get("content", ""))
             current_message_api_parts: list[types.Part] = []
-
             image_api_parts = self._handle_image_content(content_str)
             if image_api_parts:
                 current_message_api_parts.extend(image_api_parts)
-
             text_only_content = self._remove_media_patterns(content_str)
             if text_only_content:
                 current_message_api_parts.append(types.Part(text=text_only_content))
-
             if current_message_api_parts:
-                messages_for_api.append({
-
-                    'content': current_message_api_parts
-                })
-
-        return system_instruction, messages_for_api
+                messages_for_api.append({"role": msg["role"], "content": current_message_api_parts})
+        return messages_for_api
 
     def prepare(self, argument):
-
+        # @NOTE: OpenAI compatibility at high level
        if argument.prop.raw_input:
             argument.prop.prepared_input = self._prepare_raw_input(argument)
             return
 
-
+        processed_input_str = str(argument.prop.processed_input)
+        media_content = self._process_multimodal_content(processed_input_str)
+        system_content = self._compose_system_content(argument)
+        user_content = self._compose_user_content(argument)
+        system_content, user_content = self._apply_self_prompt_if_needed(
+            argument, system_content, user_content
+        )
 
-
-
+        user_prompt = self._build_user_prompt(media_content, user_content)
+        argument.prop.prepared_input = (system_content, [user_prompt])
 
+    def _compose_system_content(self, argument) -> str:
+        system_content = ""
+        _non_verbose_output = """<META_INSTRUCTION/>\nYou do not output anything else, like verbose preambles or post explanation, such as "Sure, let me...", "Hope that was helpful...", "Yes, I can help you with that...", etc. Consider well formatted output, e.g. for sentences use punctuation, spaces etc. or for code use indentation, etc. Never add meta instructions information to your output!\n\n"""
         if argument.prop.suppress_verbose_output:
             system_content += _non_verbose_output
-        system_content = f'{system_content}\n' if system_content and len(system_content) > 0 else ''
-
+        system_content = f"{system_content}\n" if system_content and len(system_content) > 0 else ""
         if argument.prop.response_format:
-
-            assert
-            if
-                system_content += '<RESPONSE_FORMAT/>\nYou are a helpful assistant designed to output JSON.\n\n'
-
+            response_format = argument.prop.response_format
+            assert response_format.get("type") is not None, "Response format type is required!"
+            if response_format["type"] == "json_object":
+                system_content += (
+                    "<RESPONSE_FORMAT/>\nYou are a helpful assistant designed to output JSON.\n\n"
+                )
         ref = argument.prop.instance
         static_ctxt, dyn_ctxt = ref.global_context
         if len(static_ctxt) > 0:
             system_content += f"<STATIC_CONTEXT/>\n{static_ctxt}\n\n"
-
         if len(dyn_ctxt) > 0:
             system_content += f"<DYNAMIC_CONTEXT/>\n{dyn_ctxt}\n\n"
-
         payload = argument.prop.payload
         if argument.prop.payload:
-            system_content += f"<ADDITIONAL_CONTEXT/>\n{str(payload)}\n\n"
-
+            system_content += f"<ADDITIONAL_CONTEXT/>\n{payload!s}\n\n"
         examples: list[str] = argument.prop.examples
         if examples and len(examples) > 0:
-            system_content += f"<EXAMPLES/>\n{str(examples)}\n\n"
-
-        # Handle multimodal content
-        processed_input_str = str(argument.prop.processed_input)
-        media_content = self._process_multimodal_content(processed_input_str)
-
+            system_content += f"<EXAMPLES/>\n{examples!s}\n\n"
         if argument.prop.prompt is not None and len(argument.prop.prompt) > 0:
             val = str(argument.prop.prompt)
             val = self._remove_media_patterns(val)
             system_content += f"<INSTRUCTION/>\n{val}\n\n"
+        if argument.prop.template_suffix:
+            system_content += f" You will only generate content for the placeholder `{argument.prop.template_suffix!s}` following the instructions and the provided context information.\n\n"
+        return system_content
 
+    def _compose_user_content(self, argument) -> str:
         suffix = str(argument.prop.processed_input)
         suffix = self._remove_media_patterns(suffix)
-
+        return f"{suffix}"
 
-
-
-
-        # Handle self-prompting
-        if argument.prop.instance._kwargs.get('self_prompt', False) or argument.prop.self_prompt:
+    def _apply_self_prompt_if_needed(self, argument, system_content: str, user_content: str):
+        if argument.prop.instance._kwargs.get("self_prompt", False) or argument.prop.self_prompt:
             self_prompter = SelfPrompt()
-
             res = self_prompter(
-                {'user': user_content, 'system': system_content},
-                max_tokens=argument.kwargs.get('max_tokens', self.max_response_tokens),
-                thinking=argument.kwargs.get('thinking', None),
+                {"user": user_content, "system": system_content},
+                max_tokens=argument.kwargs.get("max_tokens", self.max_response_tokens),
+                thinking=argument.kwargs.get("thinking", None),
             )
             if res is None:
-
+                UserMessage("Self-prompting failed!", raise_with=ValueError)
+            user_content = res["user"]
+            system_content = res["system"]
+        return system_content, user_content
 
-
-
-
-        all_user_content = []
-        all_user_content.extend(media_content) #
+    def _build_user_prompt(self, media_content, user_content: str) -> dict:
+        all_user_content = list(media_content)
         if user_content.strip():
             all_user_content.append(genai.types.Part(text=user_content.strip()))
-
         if not all_user_content:
             all_user_content = [genai.types.Part(text="N/A")]
-
-        user_prompt = {'role': 'user', 'content': all_user_content}
-
-        argument.prop.prepared_input = (system_content, [user_prompt])
+        return {"role": "user", "content": all_user_content}
 
     def _prepare_request_payload(self, argument):
         kwargs = argument.kwargs
 
         payload = {
-            "max_output_tokens": kwargs.get('max_tokens', self.max_response_tokens),
-            "temperature": kwargs.get('temperature', 1.0),
-            "top_p": kwargs.get('top_p', 0.95),
-            "top_k": kwargs.get('top_k', 40),
-            "stop_sequences": kwargs.get('stop', None),
-            "stream": kwargs.get('stream', False),
+            "max_output_tokens": kwargs.get("max_tokens", self.max_response_tokens),
+            "temperature": kwargs.get("temperature", 1.0),
+            "top_p": kwargs.get("top_p", 0.95),
+            "top_k": kwargs.get("top_k", 40),
+            "stop_sequences": kwargs.get("stop", None),
+            "stream": kwargs.get("stream", False),
         }
 
         system, _ = argument.prop.prepared_input
         if system and system.strip():
-            payload['system_instruction'] = system.strip()
+            payload["system_instruction"] = system.strip()
 
-        thinking_arg = kwargs.get('thinking', None)
+        thinking_arg = kwargs.get("thinking", None)
         if thinking_arg and isinstance(thinking_arg, dict):
             thinking_budget = thinking_arg.get("thinking_budget", 1024)
-            payload['thinking_config'] = types.ThinkingConfig(include_thoughts=True, thinking_budget=thinking_budget)
+            payload["thinking_config"] = types.ThinkingConfig(
+                include_thoughts=True, thinking_budget=thinking_budget
+            )
 
-        response_format = kwargs.get('response_format', None)
-        if response_format and response_format.get('type') == 'json_object':
-            payload['response_mime_type'] = 'application/json'
+        response_format = kwargs.get("response_format", None)
+        if response_format and response_format.get("type") == "json_object":
+            payload["response_mime_type"] = "application/json"
 
-        tools = kwargs.get('tools')
+        tools = kwargs.get("tools")
         if tools:
-            payload['tools'] = self._convert_tools_format(tools)
-            payload['automatic_function_calling'] = types.AutomaticFunctionCallingConfig(
-                disable=kwargs.get('automatic_function_calling', True)
+            payload["tools"] = self._convert_tools_format(tools)
+            payload["automatic_function_calling"] = types.AutomaticFunctionCallingConfig(
+                disable=kwargs.get("automatic_function_calling", True)
             )
 
         return payload
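Note on `_prepare_request_payload` above: it translates OpenAI-style kwargs into Gemini configuration. Two mappings are easy to miss, restated standalone below (a sketch mirroring the diff, not an excerpt from the package):

# response_format={"type": "json_object"} selects Gemini's JSON output mode.
def response_mime_type(response_format: dict | None) -> str:
    if response_format and response_format.get("type") == "json_object":
        return "application/json"
    return "text/plain"

assert response_mime_type({"type": "json_object"}) == "application/json"
assert response_mime_type(None) == "text/plain"

# A thinking kwarg such as {"thinking_budget": 2048} becomes
# types.ThinkingConfig(include_thoughts=True, thinking_budget=2048),
# whose thought parts are later surfaced as metadata["thinking"] in forward().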
@@ -584,7 +627,9 @@ class GeminiXReasoningEngine(Engine, GoogleMixin):
             elif isinstance(tool_item, types.FunctionDeclaration):
                 processed_tools.append(types.Tool(function_declarations=[tool_item]))
             else:
-
+                UserMessage(
+                    f"Ignoring invalid tool format. Expected a callable, google.genai.types.Tool, or google.genai.types.FunctionDeclaration: {tool_item}"
+                )
 
         if not processed_tools:
             return None
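A note on the recurring swap of `CustomUserWarning` for `UserMessage` across these hunks: judging by the call sites, the helper reports a message and, when `raise_with=` is given, raises that exception type. The real implementation lives in `symai/utils.py`; the stand-in below is only a behavioral sketch inferred from the calls shown above, not the packaged code:

import logging

def UserMessage(message: str, raise_with: type[Exception] | None = None) -> None:
    # Hypothetical stand-in: UserMessage("...") logs a warning;
    # UserMessage("...", raise_with=ValueError) raises ValueError instead.
    logging.warning(message)
    if raise_with is not None:
        raise raise_with(message)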