PyPI - symbolicai - Versions diffs - 0.21.0__py3-none-any.whl → 1.1.0__py3-none-any.whl - Mend

symbolicai 0.21.0__py3-none-any.whl → 1.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (134)

symai/__init__.py +269 -173
symai/backend/base.py +123 -110
symai/backend/engines/drawing/engine_bfl.py +45 -44
symai/backend/engines/drawing/engine_gpt_image.py +112 -97
symai/backend/engines/embedding/engine_llama_cpp.py +63 -52
symai/backend/engines/embedding/engine_openai.py +25 -21
symai/backend/engines/execute/engine_python.py +19 -18
symai/backend/engines/files/engine_io.py +104 -95
symai/backend/engines/imagecaptioning/engine_blip2.py +28 -24
symai/backend/engines/imagecaptioning/engine_llavacpp_client.py +102 -79
symai/backend/engines/index/engine_pinecone.py +124 -97
symai/backend/engines/index/engine_qdrant.py +1011 -0
symai/backend/engines/index/engine_vectordb.py +84 -56
symai/backend/engines/lean/engine_lean4.py +96 -52
symai/backend/engines/neurosymbolic/__init__.py +41 -13
symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_chat.py +330 -248
symai/backend/engines/neurosymbolic/engine_anthropic_claudeX_reasoning.py +329 -264
symai/backend/engines/neurosymbolic/engine_cerebras.py +328 -0
symai/backend/engines/neurosymbolic/engine_deepseekX_reasoning.py +118 -88
symai/backend/engines/neurosymbolic/engine_google_geminiX_reasoning.py +344 -299
symai/backend/engines/neurosymbolic/engine_groq.py +173 -115
symai/backend/engines/neurosymbolic/engine_huggingface.py +114 -84
symai/backend/engines/neurosymbolic/engine_llama_cpp.py +144 -118
symai/backend/engines/neurosymbolic/engine_openai_gptX_chat.py +415 -307
symai/backend/engines/neurosymbolic/engine_openai_gptX_reasoning.py +394 -231
symai/backend/engines/ocr/engine_apilayer.py +23 -27
symai/backend/engines/output/engine_stdout.py +10 -13
symai/backend/engines/{webscraping → scrape}/engine_requests.py +101 -54
symai/backend/engines/search/engine_openai.py +100 -88
symai/backend/engines/search/engine_parallel.py +665 -0
symai/backend/engines/search/engine_perplexity.py +44 -45
symai/backend/engines/search/engine_serpapi.py +37 -34
symai/backend/engines/speech_to_text/engine_local_whisper.py +54 -51
symai/backend/engines/symbolic/engine_wolframalpha.py +15 -9
symai/backend/engines/text_to_speech/engine_openai.py +20 -26
symai/backend/engines/text_vision/engine_clip.py +39 -37
symai/backend/engines/userinput/engine_console.py +5 -6
symai/backend/mixin/__init__.py +13 -0
symai/backend/mixin/anthropic.py +48 -38
symai/backend/mixin/deepseek.py +6 -5
symai/backend/mixin/google.py +7 -4
symai/backend/mixin/groq.py +2 -4
symai/backend/mixin/openai.py +140 -110
symai/backend/settings.py +87 -20
symai/chat.py +216 -123
symai/collect/__init__.py +7 -1
symai/collect/dynamic.py +80 -70
symai/collect/pipeline.py +67 -51
symai/collect/stats.py +161 -109
symai/components.py +707 -360
symai/constraints.py +24 -12
symai/core.py +1857 -1233
symai/core_ext.py +83 -80
symai/endpoints/api.py +166 -104
symai/extended/.DS_Store +0 -0
symai/extended/__init__.py +46 -12
symai/extended/api_builder.py +29 -21
symai/extended/arxiv_pdf_parser.py +23 -14
symai/extended/bibtex_parser.py +9 -6
symai/extended/conversation.py +156 -126
symai/extended/document.py +50 -30
symai/extended/file_merger.py +57 -14
symai/extended/graph.py +51 -32
symai/extended/html_style_template.py +18 -14
symai/extended/interfaces/blip_2.py +2 -3
symai/extended/interfaces/clip.py +4 -3
symai/extended/interfaces/console.py +9 -1
symai/extended/interfaces/dall_e.py +4 -2
symai/extended/interfaces/file.py +2 -0
symai/extended/interfaces/flux.py +4 -2
symai/extended/interfaces/gpt_image.py +16 -7
symai/extended/interfaces/input.py +2 -1
symai/extended/interfaces/llava.py +1 -2
symai/extended/interfaces/{naive_webscraping.py → naive_scrape.py} +4 -3
symai/extended/interfaces/naive_vectordb.py +9 -10
symai/extended/interfaces/ocr.py +5 -3
symai/extended/interfaces/openai_search.py +2 -0
symai/extended/interfaces/parallel.py +30 -0
symai/extended/interfaces/perplexity.py +2 -0
symai/extended/interfaces/pinecone.py +12 -9
symai/extended/interfaces/python.py +2 -0
symai/extended/interfaces/serpapi.py +3 -1
symai/extended/interfaces/terminal.py +2 -4
symai/extended/interfaces/tts.py +3 -2
symai/extended/interfaces/whisper.py +3 -2
symai/extended/interfaces/wolframalpha.py +2 -1
symai/extended/metrics/__init__.py +11 -1
symai/extended/metrics/similarity.py +14 -13
symai/extended/os_command.py +39 -29
symai/extended/packages/__init__.py +29 -3
symai/extended/packages/symdev.py +51 -43
symai/extended/packages/sympkg.py +41 -35
symai/extended/packages/symrun.py +63 -50
symai/extended/repo_cloner.py +14 -12
symai/extended/seo_query_optimizer.py +15 -13
symai/extended/solver.py +116 -91
symai/extended/summarizer.py +12 -10
symai/extended/taypan_interpreter.py +17 -18
symai/extended/vectordb.py +122 -92
symai/formatter/__init__.py +9 -1
symai/formatter/formatter.py +51 -47
symai/formatter/regex.py +70 -69
symai/functional.py +325 -176
symai/imports.py +190 -147
symai/interfaces.py +57 -28
symai/memory.py +45 -35
symai/menu/screen.py +28 -19
symai/misc/console.py +66 -56
symai/misc/loader.py +8 -5
symai/models/__init__.py +17 -1
symai/models/base.py +395 -236
symai/models/errors.py +1 -2
symai/ops/__init__.py +32 -22
symai/ops/measures.py +24 -25
symai/ops/primitives.py +1149 -731
symai/post_processors.py +58 -50
symai/pre_processors.py +86 -82
symai/processor.py +21 -13
symai/prompts.py +764 -685
symai/server/huggingface_server.py +135 -49
symai/server/llama_cpp_server.py +21 -11
symai/server/qdrant_server.py +206 -0
symai/shell.py +100 -42
symai/shellsv.py +700 -492
symai/strategy.py +630 -346
symai/symbol.py +368 -322
symai/utils.py +100 -78
{symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/METADATA +22 -10
symbolicai-1.1.0.dist-info/RECORD +168 -0
symbolicai-0.21.0.dist-info/RECORD +0 -162
{symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/WHEEL +0 -0
{symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/entry_points.txt +0 -0
{symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/licenses/LICENSE +0 -0
{symbolicai-0.21.0.dist-info → symbolicai-1.1.0.dist-info}/top_level.txt +0 -0

symai/backend/engines/files/engine_io.py CHANGED Viewed

@@ -1,5 +1,5 @@
+import contextlib
 import logging
-import os
 from dataclasses import dataclass
 from pathlib import Path
@@ -7,21 +7,60 @@ import pypdf
 import tika
 from tika import unpack
+from ....utils import UserMessage
 from ...base import Engine
 # Initialize Tika lazily to avoid spawning JVMs prematurely for all workers
-_TIKA_INITIALIZED = False
+_TIKA_STATE = {"initialized": False}
 def _ensure_tika_vm():
-    global _TIKA_INITIALIZED
-    if not _TIKA_INITIALIZED:
-        try:
+    if not _TIKA_STATE["initialized"]:
+        with contextlib.suppress(Exception):
             tika.initVM()
-        except Exception:
-            # If initVM fails, we still attempt unpack.from_file which may auto-init
-            pass
-        logging.getLogger('tika').setLevel(logging.CRITICAL)
-        _TIKA_INITIALIZED = True
+        logging.getLogger("tika").setLevel(logging.CRITICAL)
+        _TIKA_STATE["initialized"] = True
+def _int_or_none(value):
+    return int(value) if value != "" else None
+def _parse_slice_token(token):
+    if ":" not in token:
+        return int(token)
+    parts = token.split(":")
+    if len(parts) == 2:
+        start, end = parts
+        return slice(_int_or_none(start), _int_or_none(end), None)
+    if len(parts) == 3:
+        start, end, step = parts
+        return slice(_int_or_none(start), _int_or_none(end), _int_or_none(step))
+    return None
+def _parse_slice_spec(file_path):
+    if "[" not in file_path or "]" not in file_path:
+        return file_path, None
+    path_part, remainder = file_path.split("[", 1)
+    slice_section = remainder.split("]", 1)[0]
+    slices = []
+    for token in slice_section.split(","):
+        if token == "":
+            continue
+        parsed = _parse_slice_token(token)
+        if parsed is not None:
+            slices.append(parsed)
+    return path_part, slices or None
+def _apply_slices(lines, slices_):
+    if slices_ is None:
+        return lines
+    new_content = []
+    for slice_item in slices_:
+        new_content.extend(lines[slice_item])
+    return new_content
 @dataclass
@@ -37,97 +76,67 @@ class FileEngine(Engine):
         self.name = self.__class__.__name__
     def id(self) -> str:
-        return 'files'
+        return "files"
     def _read_slice_file(self, file_path, argument):
         # check if file is empty
-        with_metadata = argument.kwargs.get('with_metadata', False)
-        id            = Path(argument.prop.prepared_input).stem.replace(' ', '_')
-        if file_path is None or file_path.strip() == '':
+        with_metadata = argument.kwargs.get("with_metadata", False)
+        file_id = Path(argument.prop.prepared_input).stem.replace(" ", "_")
+        if file_path is None or file_path.strip() == "":
             return None
         # check if file slice is used
-        slices_ = None
-        if '[' in file_path and ']' in file_path:
-            file_parts = file_path.split('[')
-            file_path = file_parts[0]
-            # remove string up to '[' and after ']'
-            slices_s = file_parts[1].split(']')[0].split(',')
-            slices_ = []
-            for s in slices_s:
-                if s == '':
-                    continue
-                elif ':' in s:
-                    s_split = s.split(':')
-                    if len(s_split) == 2:
-                        start_slice = int(s_split[0]) if s_split[0] != '' else None
-                        end_slice = int(s_split[1]) if s_split[1] != '' else None
-                        slices_.append(slice(start_slice, end_slice, None))
-                    elif len(s_split) == 3:
-                        start_slice = int(s_split[0]) if s_split[0] != '' else None
-                        end_slice = int(s_split[1]) if s_split[1] != '' else None
-                        step_slice = int(s_split[2]) if s_split[2] != '' else None
-                        slices_.append(slice(start_slice, end_slice, step_slice))
-                else:
-                    slices_.append(int(s))
+        file_path, slices_ = _parse_slice_spec(file_path)
+        path_obj = Path(file_path)
         # check if file exists
-        assert os.path.exists(file_path), f'File does not exist: {file_path}'
+        assert path_obj.exists(), f"File does not exist: {file_path}"
         # verify if file is empty
-        if os.path.getsize(file_path) <= 0:
-            return ''
+        if path_obj.stat().st_size <= 0:
+            return ""
         # For common plain-text extensions, avoid Tika overhead
-        ext = Path(file_path).suffix.lower()
-        if ext in {'.txt', '.md', '.py', '.json', '.yaml', '.yml', '.csv', '.tsv', '.log'}:
+        ext = path_obj.suffix.lower()
+        if ext in {".txt", ".md", ".py", ".json", ".yaml", ".yml", ".csv", ".tsv", ".log"}:
             try:
-                with open(file_path, 'r', encoding='utf-8', errors='ignore') as f:
+                with path_obj.open(encoding="utf-8", errors="ignore") as f:
                     content = f.read()
                 if content is None:
                     return None
                 # Apply slicing by lines, mirroring the Tika branch
-                lines = content.split('\n')
-                if slices_ is not None:
-                    new_content = []
-                    for s in slices_:
-                        new_content.extend(lines[s])
-                    lines = new_content
-                content = '\n'.join(lines)
-                content = content.encode('utf8', 'ignore').decode('utf8', 'ignore')
-                return content if not with_metadata else [TextContainer(id, None, content)]
+                lines = content.split("\n")
+                lines = _apply_slices(lines, slices_)
+                content = "\n".join(lines)
+                content = content.encode("utf8", "ignore").decode("utf8", "ignore")
+                return content if not with_metadata else [TextContainer(file_id, None, content)]
             except Exception:
                 # Fallback to Tika if plain read fails
                 pass
         _ensure_tika_vm()
-        file_ = unpack.from_file(str(file_path))
-        if 'content' in file_:
-            content = file_['content']
-        else:
-            content = str(file_)
+        file_ = unpack.from_file(str(path_obj))
+        content = file_["content"] if "content" in file_ else str(file_)
         if content is None:
             return None
-        content = content.split('\n')
-        if slices_ is not None:
-            new_content = []
-            for s in slices_:
-                new_content.extend(content[s])
-            content = new_content
-        content = '\n'.join(content)
-        content = content.encode('utf8', 'ignore').decode('utf8', 'ignore')
-        return content if not with_metadata else [TextContainer(id, None, content)]
+        content = content.split("\n")
+        content = _apply_slices(content, slices_)
+        content = "\n".join(content)
+        content = content.encode("utf8", "ignore").decode("utf8", "ignore")
+        return content if not with_metadata else [TextContainer(file_id, None, content)]
     def reset_eof_of_pdf_return_stream(self, pdf_stream_in: list):
         actual_line = len(pdf_stream_in)  # Predefined value in case EOF not found
         # find the line position of the EOF
         for i, x in enumerate(pdf_stream_in[::-1]):
-            if b'%%EOF' in x:
-                actual_line = len(pdf_stream_in)-i
-                print(f'EOF found at line position {-i} = actual {actual_line}, with value {x}')
+            if b"%%EOF" in x:
+                actual_line = len(pdf_stream_in) - i
+                UserMessage(
+                    f"EOF found at line position {-i} = actual {actual_line}, with value {x}"
+                )
                 break
         # return the list up to that point
@@ -135,56 +144,56 @@ class FileEngine(Engine):
     def fix_pdf(self, file_path: str):
         # opens the file for reading
-        with open(file_path, 'rb') as p:
-            txt = (p.readlines())
+        path_obj = Path(file_path)
+        with path_obj.open("rb") as p:
+            txt = p.readlines()
         # get the new list terminating correctly
         txtx = self.reset_eof_of_pdf_return_stream(txt)
         # write to new pdf
-        new_file_path = f'{file_path}_fixed.pdf'
-        with open(new_file_path, 'wb') as f:
+        new_file_path = Path(f"{file_path}_fixed.pdf")
+        with new_file_path.open("wb") as f:
             f.writelines(txtx)
-        fixed_pdf = pypdf.PdfReader(new_file_path)
-        return fixed_pdf
+        return pypdf.PdfReader(str(new_file_path))
     def read_text(self, pdf_reader, page_range, argument):
         txt = []
-        n_pages  = len(pdf_reader.pages)
-        with_metadata = argument.kwargs.get('with_metadata', False)
-        id       = Path(argument.prop.prepared_input).stem.replace(' ', '_')
+        n_pages = len(pdf_reader.pages)
+        with_metadata = argument.kwargs.get("with_metadata", False)
+        file_id = Path(argument.prop.prepared_input).stem.replace(" ", "_")
         for i in range(n_pages)[slice(0, n_pages) if page_range is None else page_range]:
             page = pdf_reader.pages[i]
             extracted = page.extract_text()
-            extracted = extracted.encode('utf8', 'ignore').decode('utf8', 'ignore')
+            extracted = extracted.encode("utf8", "ignore").decode("utf8", "ignore")
             if with_metadata:
-                txt.append(TextContainer(id, str(i), extracted))
+                txt.append(TextContainer(file_id, str(i), extracted))
             else:
                 txt.append(extracted)
-        return '\n'.join(txt) if not with_metadata else txt
+        return "\n".join(txt) if not with_metadata else txt
     def forward(self, argument):
-        kwargs        = argument.kwargs
-        path          = argument.prop.prepared_input
+        kwargs = argument.kwargs
+        path = argument.prop.prepared_input
-        if '.pdf' in path:
+        if ".pdf" in path:
             page_range = None
-            if 'slice' in kwargs:
-                page_range = kwargs['slice']
-                if isinstance(page_range, tuple) or isinstance(page_range, list):
+            if "slice" in kwargs:
+                page_range = kwargs["slice"]
+                if isinstance(page_range, (tuple, list)):
                     page_range = slice(*page_range)
-            rsp = ''
+            rsp = ""
             try:
-                with open(str(path), 'rb') as f:
+                with Path(path).open("rb") as f:
                     # creating a pdf reader object
                     pdf_reader = pypdf.PdfReader(f)
                     rsp = self.read_text(pdf_reader, page_range, argument)
             except Exception as e:
-                print(f'Error reading PDF: {e} | {path}')
-                if 'fix_pdf' not in kwargs or not kwargs['fix_pdf']:
+                UserMessage(f"Error reading PDF: {e} | {path}")
+                if "fix_pdf" not in kwargs or not kwargs["fix_pdf"]:
                     raise e
                 fixed_pdf = self.fix_pdf(str(path))
                 pdf_reader_fixed = pypdf.PdfReader(fixed_pdf)
@@ -193,11 +202,11 @@ class FileEngine(Engine):
             try:
                 rsp = self._read_slice_file(path, argument)
             except Exception as e:
-                print(f'Error reading empty file: {e} | {path}')
+                UserMessage(f"Error reading empty file: {e} | {path}")
                 raise e
         if rsp is None:
-            raise Exception(f'Error reading file - empty result: {path}')
+            UserMessage(f"Error reading file - empty result: {path}", raise_with=Exception)
         metadata = {}
@@ -206,5 +215,5 @@ class FileEngine(Engine):
     def prepare(self, argument):
         assert not argument.prop.processed_input, "FileEngine does not support processed_input."
         path = argument.prop.path
-        path = path.replace('\\', '')
+        path = path.replace("\\", "")
         argument.prop.prepared_input = path

symai/backend/engines/imagecaptioning/engine_blip2.py CHANGED Viewed

@@ -1,5 +1,3 @@
-from typing import List
 import requests
 import torch
@@ -10,6 +8,7 @@ except ImportError:
 from PIL import Image
+from ....utils import UserMessage
 from ...base import Engine
 from ...settings import SYMAI_CONFIG
@@ -18,7 +17,7 @@ class Blip2Engine(Engine):
     def __init__(self):
         super().__init__()
         self.config = SYMAI_CONFIG
-        ids = self.config['CAPTION_ENGINE_MODEL'].split('/')
+        ids = self.config["CAPTION_ENGINE_MODEL"].split("/")
         if len(ids) != 2:
             # return unregistered engine
             return
@@ -27,42 +26,47 @@ class Blip2Engine(Engine):
         self.model = None  # lazy loading
         self.vis_processors = None  # lazy loading
         self.txt_processors = None  # lazy loading
-        self.device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         self.name = self.__class__.__name__
     def id(self) -> str:
-        if  self.config['CAPTION_ENGINE_MODEL'] and \
-            'blip2' in self.config['CAPTION_ENGINE_MODEL']:
-            return 'imagecaptioning'
-        return super().id() # default to unregistered
+        if self.config["CAPTION_ENGINE_MODEL"] and "blip2" in self.config["CAPTION_ENGINE_MODEL"]:
+            return "imagecaptioning"
+        return super().id()  # default to unregistered
     def command(self, *args, **kwargs):
         super().command(*args, **kwargs)
-        if 'CAPTION_ENGINE_MODEL' in kwargs:
-            self.model_id = kwargs['CAPTION_ENGINE_MODEL']
+        if "CAPTION_ENGINE_MODEL" in kwargs:
+            self.model_id = kwargs["CAPTION_ENGINE_MODEL"]
     def forward(self, argument):
         if load_model_and_preprocess is None:
-            raise ImportError('Blip2 is not installed. Please install it with `pip install symbolicai[blip2]`')
+            UserMessage(
+                "Blip2 is not installed. Please install it with `pip install symbolicai[blip2]`",
+                raise_with=ImportError,
+            )
         if self.model is None:
-            self.model, self.vis_processors, self.txt_processors  = load_model_and_preprocess(name       = self.name_id,
-                                                                                              model_type = self.model_id,
-                                                                                              is_eval    = True,
-                                                                                              device     = self.device)
+            self.model, self.vis_processors, self.txt_processors = load_model_and_preprocess(
+                name=self.name_id, model_type=self.model_id, is_eval=True, device=self.device
+            )
         image, prompt = argument.prop.prepared_input
-        kwargs        = argument.kwargs
-        except_remedy = kwargs['except_remedy'] if 'except_remedy' in kwargs else None
+        kwargs = argument.kwargs
+        except_remedy = kwargs.get("except_remedy")
-        if 'http' in image:
-            image = Image.open(requests.get(image, stream=True).raw).convert('RGB')
-        elif '/' in image or '\\' in image:
-            image = Image.open(image).convert('RGB')
+        if "http" in image:
+            image = Image.open(requests.get(image, stream=True).raw).convert("RGB")
+        elif "/" in image or "\\" in image:
+            image = Image.open(image).convert("RGB")
         try:
-            image   = self.vis_processors['eval'](image).unsqueeze(0).to(self.device)
-            prompt  = self.txt_processors['eval'](prompt)
-            res     = self.model.generate(samples={"image": image, "prompt": prompt}, use_nucleus_sampling=True, num_captions=3)
+            image = self.vis_processors["eval"](image).unsqueeze(0).to(self.device)
+            prompt = self.txt_processors["eval"](prompt)
+            res = self.model.generate(
+                samples={"image": image, "prompt": prompt},
+                use_nucleus_sampling=True,
+                num_captions=3,
+            )
         except Exception as e:
             if except_remedy is None:
                 raise e

symai/backend/engines/imagecaptioning/engine_llavacpp_client.py CHANGED Viewed

@@ -1,48 +1,48 @@
-import logging
-import requests
-import json
 import io
+import json
+import logging
+from pathlib import Path
-from typing import List
-from requests_toolbelt.multipart.encoder import MultipartEncoder
+import requests
 from PIL.Image import Image
+from requests_toolbelt.multipart.encoder import MultipartEncoder
+from ....symbol import Result
+from ....utils import UserMessage
 from ...base import Engine
 from ...settings import SYMAI_CONFIG
-from ....symbol import Result
-def image_to_byte_array(image: Image, format='PNG') -> bytes:
-  # BytesIO is a file-like buffer stored in memory
-  imgByteArr = io.BytesIO()
-  # image.save expects a file-like as a argument
-  image.save(imgByteArr, format=format)
-  # Turn the BytesIO object back into a bytes object
-  imgByteArr = imgByteArr.getvalue()
-  return imgByteArr
+def image_to_byte_array(image: Image, format="PNG") -> bytes:
+    # BytesIO is a file-like buffer stored in memory
+    imgByteArr = io.BytesIO()
+    # image.save expects a file-like as a argument
+    image.save(imgByteArr, format=format)
+    # Turn the BytesIO object back into a bytes object
+    return imgByteArr.getvalue()
 class LLaMAResult(Result):
     def __init__(self, value=None, *args, **kwargs):
         super().__init__(value, *args, **kwargs)
         self._value = value
-        self.error  = None
-        self.raw    = value
+        self.error = None
+        self.raw = value
         self._perse_result()
     def _perse_result(self):
-        val        = json.loads(self.value)
+        val = json.loads(self.value)
         self.value = val
-        if 'error' in val:
-            self.error = val['error']
-        if 'content' in val:
-            self.value = val['content']
+        if "error" in val:
+            self.error = val["error"]
+        if "content" in val:
+            self.value = val["content"]
 class LLaMACppClientEngine(Engine):
-    def __init__(self, host: str = 'localhost', port: int = 8080, timeout: int = 240):
+    def __init__(self, host: str = "localhost", port: int = 8080, timeout: int = 240):
         super().__init__()
-        logger = logging.getLogger('nesy_client')
+        logger = logging.getLogger("nesy_client")
         logger.setLevel(logging.WARNING)
         self.config = SYMAI_CONFIG
         self.host = host
@@ -51,43 +51,45 @@ class LLaMACppClientEngine(Engine):
         self.name = self.__class__.__name__
     def id(self) -> str:
-        if  self.config['CAPTION_ENGINE_MODEL'] and \
-            'llavacpp' in self.config['CAPTION_ENGINE_MODEL']:
-            return 'imagecaptioning'
-        return super().id() # default to unregistered
+        if (
+            self.config["CAPTION_ENGINE_MODEL"]
+            and "llavacpp" in self.config["CAPTION_ENGINE_MODEL"]
+        ):
+            return "imagecaptioning"
+        return super().id()  # default to unregistered
     @property
     def max_tokens(self):
         return 4096
     def forward(self, argument):
-        prompts             = argument.prop.prepared_input
-        kwargs              = argument.kwargs
+        prompts = argument.prop.prepared_input
+        kwargs = argument.kwargs
         system, user, image = prompts
         # escape special characters
-        system              = system['content']
-        user                = user['content']
+        system = system["content"]
+        user = user["content"]
-        if isinstance(image['content'], Image):
+        if isinstance(image["content"], Image):
             # format image to bytes
-            format_ = argument.prop.image_format if argument.prop.image_format else 'PNG'
-            im_bytes = image_to_byte_array(image['content'], format=format_)
+            format_ = argument.prop.image_format if argument.prop.image_format else "PNG"
+            im_bytes = image_to_byte_array(image["content"], format=format_)
         else:
             # Convert image to bytes, open as binary
-            with open(image['content'], 'rb') as f:
+            with Path(image["content"]).open("rb") as f:
                 im_bytes = f.read()
         # Create multipart/form-data payload
-        payload      = MultipartEncoder(
+        payload = MultipartEncoder(
             fields={
-                'user_prompt': ('user_prompt', user, 'text/plain'),
-                'image_file': ('image_file', im_bytes, 'application/octet-stream'),
-                'system_prompt': ('system_prompt', system, 'text/plain')
+                "user_prompt": ("user_prompt", user, "text/plain"),
+                "image_file": ("image_file", im_bytes, "application/octet-stream"),
+                "system_prompt": ("system_prompt", system, "text/plain"),
             }
         )
         # Update the headers for multipart/form-data
-        headers       = {'Content-Type': payload.content_type}
-        api           = f'http://{self.host}:{self.port}/llava'
-        except_remedy = kwargs['except_remedy'] if 'except_remedy' in kwargs else None
+        headers = {"Content-Type": payload.content_type}
+        api = f"http://{self.host}:{self.port}/llava"
+        except_remedy = kwargs.get("except_remedy")
         try:
             # use http localhost 8000 to send a request to the server
             rsp = requests.post(api, data=payload, headers=headers, timeout=self.timeout)
@@ -95,27 +97,31 @@ class LLaMACppClientEngine(Engine):
         except Exception as e:
             if except_remedy is None:
                 raise e
-            callback = lambda: requests.post(api, data=payload, headers=headers, timeout=self.timeout)
+            def callback():
+                return requests.post(api, data=payload, headers=headers, timeout=self.timeout)
             res = except_remedy(self, e, callback, argument)
         metadata = {}
-        res    = LLaMAResult(res)
-        rsp    = [res]
+        res = LLaMAResult(res)
+        rsp = [res]
         output = rsp if isinstance(prompts, list) else rsp[0]
         return output, metadata
-    def prepare(self, argument):
-        if argument.prop.raw_input:
-            if not argument.prop.processed_input:
-                raise ValueError('Need to provide a prompt instruction to the engine if raw_input is enabled.')
-            argument.prop.prepared_input = argument.prop.processed_input
-            return
-        user:   str = ""
-        system: str = ""
-        system = f'{system}\n' if system and len(system) > 0 else ''
+    def _handle_raw_input(self, argument) -> bool:
+        if not argument.prop.raw_input:
+            return False
+        if not argument.prop.processed_input:
+            UserMessage(
+                "Need to provide a prompt instruction to the engine if raw_input is enabled.",
+                raise_with=ValueError,
+            )
+        argument.prop.prepared_input = argument.prop.processed_input
+        return True
+    def _append_context_sections(self, system: str, argument) -> str:
         ref = argument.prop.instance
         static_ctxt, dyn_ctxt = ref.global_context
         if len(static_ctxt) > 0:
@@ -126,40 +132,57 @@ class LLaMACppClientEngine(Engine):
         payload = argument.prop.payload
         if argument.prop.payload:
-            system += f"[ADDITIONAL CONTEXT]\n{str(payload)}\n\n"
+            system += f"[ADDITIONAL CONTEXT]\n{payload!s}\n\n"
-        examples: List[str] = argument.prop.examples
+        examples: list[str] = argument.prop.examples
         if examples and len(examples) > 0:
-            system += f"[EXAMPLES]\n{str(examples)}\n\n"
+            system += f"[EXAMPLES]\n{examples!s}\n\n"
+        return system
+    def _build_user_instruction(self, argument) -> str:
+        user = ""
         if argument.prop.prompt is not None and len(argument.prop.prompt) > 0:
             val = str(argument.prop.prompt)
-            # in this engine, instructions are considered as user prompts
             user += f"[INSTRUCTION]\n{val}"
-        suffix: str = str(argument.prop.processed_input)
-        if '[SYSTEM_INSTRUCTION::]: <<<' in suffix and argument.prop.parse_system_instructions:
-            parts = suffix.split('\n>>>\n')
-            # first parts are the system instructions
-            c = 0
-            for i, p in enumerate(parts):
-                if 'SYSTEM_INSTRUCTION' in p:
-                    system += f"{p}\n"
-                    c += 1
+        return user
+    def _extract_system_instructions(self, argument, system: str, suffix: str) -> tuple[str, str]:
+        if "[SYSTEM_INSTRUCTION::]: <<<" in suffix and argument.prop.parse_system_instructions:
+            parts = suffix.split("\n>>>\n")
+            consumed = 0
+            for part in parts:
+                if "SYSTEM_INSTRUCTION" in part:
+                    system += f"{part}\n"
+                    consumed += 1
                 else:
                     break
-            # last part is the user input
-            suffix = '\n>>>\n'.join(parts[c:])
-        user += f"{suffix}"
+            suffix = "\n>>>\n".join(parts[consumed:])
+        return system, suffix
+    def _append_template_suffix(self, user: str, argument) -> str:
         if argument.prop.template_suffix:
-            user += f"\n[[PLACEHOLDER]]\n{str(argument.prop.template_suffix)}\n\n"
-            user += f"Only generate content for the placeholder `[[PLACEHOLDER]]` following the instructions and context information. Do NOT write `[[PLACEHOLDER]]` or anything else in your output.\n\n"
+            user += f"\n[[PLACEHOLDER]]\n{argument.prop.template_suffix!s}\n\n"
+            user += "Only generate content for the placeholder `[[PLACEHOLDER]]` following the instructions and context information. Do NOT write `[[PLACEHOLDER]]` or anything else in your output.\n\n"
+        return user
+    def prepare(self, argument):
+        if self._handle_raw_input(argument):
+            return
+        system: str = ""
+        system = f"{system}\n" if system and len(system) > 0 else ""
+        system = self._append_context_sections(system, argument)
+        user = self._build_user_instruction(argument)
+        suffix: str = str(argument.prop.processed_input)
+        system, suffix = self._extract_system_instructions(argument, system, suffix)
+        user += f"{suffix}"
+        user = self._append_template_suffix(user, argument)
-        user_prompt = { "role": "user", "content": user }
+        user_prompt = {"role": "user", "content": user}
         argument.prop.prepared_input = [
-            { "role": "system", "content": system },
+            {"role": "system", "content": system},
             user_prompt,
-            { "role": "image", "content": argument.prop.image }
+            {"role": "image", "content": argument.prop.image},
         ]

symbolicai 0.21.0__py3-none-any.whl → 1.1.0__py3-none-any.whl

symbolicai 0.21.0__py3-none-any.whl → 1.1.0__py3-none-any.whl