lionagi 0.1.2__py3-none-any.whl → 0.2.0__py3-none-any.whl
- lionagi/__init__.py +60 -5
- lionagi/core/__init__.py +0 -25
- lionagi/core/_setting/_setting.py +59 -0
- lionagi/core/action/__init__.py +14 -0
- lionagi/core/action/function_calling.py +136 -0
- lionagi/core/action/manual.py +1 -0
- lionagi/core/action/node.py +109 -0
- lionagi/core/action/tool.py +114 -0
- lionagi/core/action/tool_manager.py +356 -0
- lionagi/core/agent/base_agent.py +27 -13
- lionagi/core/agent/eval/evaluator.py +1 -0
- lionagi/core/agent/eval/vote.py +40 -0
- lionagi/core/agent/learn/learner.py +59 -0
- lionagi/core/agent/plan/unit_template.py +1 -0
- lionagi/core/collections/__init__.py +17 -0
- lionagi/core/{generic/data_logger.py → collections/_logger.py} +69 -55
- lionagi/core/collections/abc/__init__.py +53 -0
- lionagi/core/collections/abc/component.py +615 -0
- lionagi/core/collections/abc/concepts.py +297 -0
- lionagi/core/collections/abc/exceptions.py +150 -0
- lionagi/core/collections/abc/util.py +45 -0
- lionagi/core/collections/exchange.py +161 -0
- lionagi/core/collections/flow.py +426 -0
- lionagi/core/collections/model.py +419 -0
- lionagi/core/collections/pile.py +913 -0
- lionagi/core/collections/progression.py +236 -0
- lionagi/core/collections/util.py +64 -0
- lionagi/core/director/direct.py +314 -0
- lionagi/core/director/director.py +2 -0
- lionagi/core/{execute/branch_executor.py → engine/branch_engine.py} +134 -97
- lionagi/core/{execute/instruction_map_executor.py → engine/instruction_map_engine.py} +80 -55
- lionagi/{experimental/directive/evaluator → core/engine}/script_engine.py +17 -1
- lionagi/core/executor/base_executor.py +90 -0
- lionagi/core/{execute/structure_executor.py → executor/graph_executor.py} +62 -66
- lionagi/core/{execute → executor}/neo4j_executor.py +70 -67
- lionagi/core/generic/__init__.py +3 -33
- lionagi/core/generic/edge.py +29 -79
- lionagi/core/generic/edge_condition.py +16 -0
- lionagi/core/generic/graph.py +236 -0
- lionagi/core/generic/hyperedge.py +1 -0
- lionagi/core/generic/node.py +156 -221
- lionagi/core/generic/tree.py +48 -0
- lionagi/core/generic/tree_node.py +79 -0
- lionagi/core/mail/__init__.py +12 -0
- lionagi/core/mail/mail.py +25 -0
- lionagi/core/mail/mail_manager.py +139 -58
- lionagi/core/mail/package.py +45 -0
- lionagi/core/mail/start_mail.py +36 -0
- lionagi/core/message/__init__.py +19 -0
- lionagi/core/message/action_request.py +133 -0
- lionagi/core/message/action_response.py +135 -0
- lionagi/core/message/assistant_response.py +95 -0
- lionagi/core/message/instruction.py +234 -0
- lionagi/core/message/message.py +101 -0
- lionagi/core/message/system.py +86 -0
- lionagi/core/message/util.py +283 -0
- lionagi/core/report/__init__.py +4 -0
- lionagi/core/report/base.py +217 -0
- lionagi/core/report/form.py +231 -0
- lionagi/core/report/report.py +166 -0
- lionagi/core/report/util.py +28 -0
- lionagi/core/rule/_default.py +16 -0
- lionagi/core/rule/action.py +99 -0
- lionagi/core/rule/base.py +238 -0
- lionagi/core/rule/boolean.py +56 -0
- lionagi/core/rule/choice.py +47 -0
- lionagi/core/rule/mapping.py +96 -0
- lionagi/core/rule/number.py +71 -0
- lionagi/core/rule/rulebook.py +109 -0
- lionagi/core/rule/string.py +52 -0
- lionagi/core/rule/util.py +35 -0
- lionagi/core/session/branch.py +431 -0
- lionagi/core/session/directive_mixin.py +287 -0
- lionagi/core/session/session.py +229 -903
- lionagi/core/structure/__init__.py +1 -0
- lionagi/core/structure/chain.py +1 -0
- lionagi/core/structure/forest.py +1 -0
- lionagi/core/structure/graph.py +1 -0
- lionagi/core/structure/tree.py +1 -0
- lionagi/core/unit/__init__.py +5 -0
- lionagi/core/unit/parallel_unit.py +245 -0
- lionagi/core/unit/template/action.py +81 -0
- lionagi/core/unit/template/base.py +51 -0
- lionagi/core/unit/template/plan.py +84 -0
- lionagi/core/unit/template/predict.py +109 -0
- lionagi/core/unit/template/score.py +124 -0
- lionagi/core/unit/template/select.py +104 -0
- lionagi/core/unit/unit.py +362 -0
- lionagi/core/unit/unit_form.py +305 -0
- lionagi/core/unit/unit_mixin.py +1168 -0
- lionagi/core/unit/util.py +71 -0
- lionagi/core/validator/validator.py +364 -0
- lionagi/core/work/work.py +74 -0
- lionagi/core/work/work_function.py +92 -0
- lionagi/core/work/work_queue.py +81 -0
- lionagi/core/work/worker.py +195 -0
- lionagi/core/work/worklog.py +124 -0
- lionagi/experimental/compressor/base.py +46 -0
- lionagi/experimental/compressor/llm_compressor.py +247 -0
- lionagi/experimental/compressor/llm_summarizer.py +61 -0
- lionagi/experimental/compressor/util.py +70 -0
- lionagi/experimental/directive/__init__.py +19 -0
- lionagi/experimental/directive/parser/base_parser.py +69 -2
- lionagi/experimental/directive/{template_ → template}/base_template.py +17 -1
- lionagi/{libs/ln_tokenizer.py → experimental/directive/tokenizer.py} +16 -0
- lionagi/experimental/{directive/evaluator → evaluator}/ast_evaluator.py +16 -0
- lionagi/experimental/{directive/evaluator → evaluator}/base_evaluator.py +16 -0
- lionagi/experimental/knowledge/base.py +10 -0
- lionagi/experimental/memory/__init__.py +0 -0
- lionagi/experimental/strategies/__init__.py +0 -0
- lionagi/experimental/strategies/base.py +1 -0
- lionagi/integrations/bridge/langchain_/documents.py +4 -0
- lionagi/integrations/bridge/llamaindex_/index.py +30 -0
- lionagi/integrations/bridge/llamaindex_/llama_index_bridge.py +6 -0
- lionagi/integrations/chunker/chunk.py +161 -24
- lionagi/integrations/config/oai_configs.py +34 -3
- lionagi/integrations/config/openrouter_configs.py +14 -2
- lionagi/integrations/loader/load.py +122 -21
- lionagi/integrations/loader/load_util.py +6 -77
- lionagi/integrations/provider/_mapping.py +46 -0
- lionagi/integrations/provider/litellm.py +2 -1
- lionagi/integrations/provider/mlx_service.py +16 -9
- lionagi/integrations/provider/oai.py +91 -4
- lionagi/integrations/provider/ollama.py +6 -5
- lionagi/integrations/provider/openrouter.py +115 -8
- lionagi/integrations/provider/services.py +2 -2
- lionagi/integrations/provider/transformers.py +18 -22
- lionagi/integrations/storage/__init__.py +3 -3
- lionagi/integrations/storage/neo4j.py +52 -60
- lionagi/integrations/storage/storage_util.py +44 -46
- lionagi/integrations/storage/structure_excel.py +43 -26
- lionagi/integrations/storage/to_excel.py +11 -4
- lionagi/libs/__init__.py +22 -1
- lionagi/libs/ln_api.py +75 -20
- lionagi/libs/ln_context.py +37 -0
- lionagi/libs/ln_convert.py +21 -9
- lionagi/libs/ln_func_call.py +69 -28
- lionagi/libs/ln_image.py +107 -0
- lionagi/libs/ln_nested.py +26 -11
- lionagi/libs/ln_parse.py +82 -23
- lionagi/libs/ln_queue.py +16 -0
- lionagi/libs/ln_tokenize.py +164 -0
- lionagi/libs/ln_validate.py +16 -0
- lionagi/libs/special_tokens.py +172 -0
- lionagi/libs/sys_util.py +95 -24
- lionagi/lions/coder/code_form.py +13 -0
- lionagi/lions/coder/coder.py +50 -3
- lionagi/lions/coder/util.py +30 -25
- lionagi/tests/libs/test_func_call.py +23 -21
- lionagi/tests/libs/test_nested.py +36 -21
- lionagi/tests/libs/test_parse.py +1 -1
- lionagi/tests/test_core/collections/__init__.py +0 -0
- lionagi/tests/test_core/collections/test_component.py +206 -0
- lionagi/tests/test_core/collections/test_exchange.py +138 -0
- lionagi/tests/test_core/collections/test_flow.py +145 -0
- lionagi/tests/test_core/collections/test_pile.py +171 -0
- lionagi/tests/test_core/collections/test_progression.py +129 -0
- lionagi/tests/test_core/generic/test_edge.py +67 -0
- lionagi/tests/test_core/generic/test_graph.py +96 -0
- lionagi/tests/test_core/generic/test_node.py +106 -0
- lionagi/tests/test_core/generic/test_tree_node.py +73 -0
- lionagi/tests/test_core/test_branch.py +115 -294
- lionagi/tests/test_core/test_form.py +46 -0
- lionagi/tests/test_core/test_report.py +105 -0
- lionagi/tests/test_core/test_validator.py +111 -0
- lionagi/version.py +1 -1
- lionagi-0.2.0.dist-info/LICENSE +202 -0
- lionagi-0.2.0.dist-info/METADATA +272 -0
- lionagi-0.2.0.dist-info/RECORD +240 -0
- lionagi/core/branch/base.py +0 -653
- lionagi/core/branch/branch.py +0 -474
- lionagi/core/branch/flow_mixin.py +0 -96
- lionagi/core/branch/util.py +0 -323
- lionagi/core/direct/__init__.py +0 -19
- lionagi/core/direct/cot.py +0 -123
- lionagi/core/direct/plan.py +0 -164
- lionagi/core/direct/predict.py +0 -166
- lionagi/core/direct/react.py +0 -171
- lionagi/core/direct/score.py +0 -279
- lionagi/core/direct/select.py +0 -170
- lionagi/core/direct/sentiment.py +0 -1
- lionagi/core/direct/utils.py +0 -110
- lionagi/core/direct/vote.py +0 -64
- lionagi/core/execute/base_executor.py +0 -47
- lionagi/core/flow/baseflow.py +0 -23
- lionagi/core/flow/monoflow/ReAct.py +0 -240
- lionagi/core/flow/monoflow/__init__.py +0 -9
- lionagi/core/flow/monoflow/chat.py +0 -95
- lionagi/core/flow/monoflow/chat_mixin.py +0 -253
- lionagi/core/flow/monoflow/followup.py +0 -215
- lionagi/core/flow/polyflow/__init__.py +0 -1
- lionagi/core/flow/polyflow/chat.py +0 -251
- lionagi/core/form/action_form.py +0 -26
- lionagi/core/form/field_validator.py +0 -287
- lionagi/core/form/form.py +0 -302
- lionagi/core/form/mixin.py +0 -214
- lionagi/core/form/scored_form.py +0 -13
- lionagi/core/generic/action.py +0 -26
- lionagi/core/generic/component.py +0 -532
- lionagi/core/generic/condition.py +0 -46
- lionagi/core/generic/mail.py +0 -90
- lionagi/core/generic/mailbox.py +0 -36
- lionagi/core/generic/relation.py +0 -70
- lionagi/core/generic/signal.py +0 -22
- lionagi/core/generic/structure.py +0 -362
- lionagi/core/generic/transfer.py +0 -20
- lionagi/core/generic/work.py +0 -40
- lionagi/core/graph/graph.py +0 -126
- lionagi/core/graph/tree.py +0 -190
- lionagi/core/mail/schema.py +0 -63
- lionagi/core/messages/schema.py +0 -325
- lionagi/core/tool/__init__.py +0 -5
- lionagi/core/tool/tool.py +0 -28
- lionagi/core/tool/tool_manager.py +0 -283
- lionagi/experimental/report/form.py +0 -64
- lionagi/experimental/report/report.py +0 -138
- lionagi/experimental/report/util.py +0 -47
- lionagi/experimental/tool/function_calling.py +0 -43
- lionagi/experimental/tool/manual.py +0 -66
- lionagi/experimental/tool/schema.py +0 -59
- lionagi/experimental/tool/tool_manager.py +0 -138
- lionagi/experimental/tool/util.py +0 -16
- lionagi/experimental/validator/rule.py +0 -139
- lionagi/experimental/validator/validator.py +0 -56
- lionagi/experimental/work/__init__.py +0 -10
- lionagi/experimental/work/async_queue.py +0 -54
- lionagi/experimental/work/schema.py +0 -73
- lionagi/experimental/work/work_function.py +0 -67
- lionagi/experimental/work/worker.py +0 -56
- lionagi/experimental/work2/form.py +0 -371
- lionagi/experimental/work2/report.py +0 -289
- lionagi/experimental/work2/schema.py +0 -30
- lionagi/experimental/work2/tests.py +0 -72
- lionagi/experimental/work2/work_function.py +0 -89
- lionagi/experimental/work2/worker.py +0 -12
- lionagi/integrations/bridge/llamaindex_/get_index.py +0 -294
- lionagi/tests/test_core/generic/test_component.py +0 -89
- lionagi/tests/test_core/test_base_branch.py +0 -426
- lionagi/tests/test_core/test_chat_flow.py +0 -63
- lionagi/tests/test_core/test_mail_manager.py +0 -75
- lionagi/tests/test_core/test_prompts.py +0 -51
- lionagi/tests/test_core/test_session.py +0 -254
- lionagi/tests/test_core/test_session_base_util.py +0 -313
- lionagi/tests/test_core/test_tool_manager.py +0 -95
- lionagi-0.1.2.dist-info/LICENSE +0 -9
- lionagi-0.1.2.dist-info/METADATA +0 -174
- lionagi-0.1.2.dist-info/RECORD +0 -206
- /lionagi/core/{branch → _setting}/__init__.py +0 -0
- /lionagi/core/{execute → agent/eval}/__init__.py +0 -0
- /lionagi/core/{flow → agent/learn}/__init__.py +0 -0
- /lionagi/core/{form → agent/plan}/__init__.py +0 -0
- /lionagi/core/{branch/executable_branch.py → agent/plan/plan.py} +0 -0
- /lionagi/core/{graph → director}/__init__.py +0 -0
- /lionagi/core/{messages → engine}/__init__.py +0 -0
- /lionagi/{experimental/directive/evaluator → core/engine}/sandbox_.py +0 -0
- /lionagi/{experimental/directive/evaluator → core/executor}/__init__.py +0 -0
- /lionagi/{experimental/directive/template_ → core/rule}/__init__.py +0 -0
- /lionagi/{experimental/report → core/unit/template}/__init__.py +0 -0
- /lionagi/{experimental/tool → core/validator}/__init__.py +0 -0
- /lionagi/{experimental/validator → core/work}/__init__.py +0 -0
- /lionagi/experimental/{work2 → compressor}/__init__.py +0 -0
- /lionagi/{core/flow/mono_chat_mixin.py → experimental/directive/template/__init__.py} +0 -0
- /lionagi/experimental/directive/{schema.py → template/schema.py} +0 -0
- /lionagi/experimental/{work2/util.py → evaluator/__init__.py} +0 -0
- /lionagi/experimental/{work2/work.py → knowledge/__init__.py} +0 -0
- /lionagi/{tests/libs/test_async.py → experimental/knowledge/graph.py} +0 -0
- {lionagi-0.1.2.dist-info → lionagi-0.2.0.dist-info}/WHEEL +0 -0
- {lionagi-0.1.2.dist-info → lionagi-0.2.0.dist-info}/top_level.txt +0 -0
lionagi/libs/ln_image.py
ADDED
@@ -0,0 +1,107 @@
+import base64
+import numpy as np
+from typing import Optional
+from .sys_util import SysUtil
+
+
+class ImageUtil:
+
+    @staticmethod
+    def preprocess_image(
+        image: np.ndarray, color_conversion_code: Optional[int] = None
+    ) -> np.ndarray:
+        SysUtil.check_import("cv2", pip_name="opencv-python")
+        import cv2
+
+        color_conversion_code = color_conversion_code or cv2.COLOR_BGR2RGB
+        return cv2.cvtColor(image, color_conversion_code)
+
+    @staticmethod
+    def encode_image_to_base64(image: np.ndarray, file_extension: str = ".jpg") -> str:
+        SysUtil.check_import("cv2", pip_name="opencv-python")
+        import cv2
+
+        success, buffer = cv2.imencode(file_extension, image)
+        if not success:
+            raise ValueError(f"Could not encode image to {file_extension} format.")
+        encoded_image = base64.b64encode(buffer).decode("utf-8")
+        return encoded_image
+
+    @staticmethod
+    def read_image_to_array(
+        image_path: str, color_flag: Optional[int] = None
+    ) -> np.ndarray:
+        SysUtil.check_import("cv2", pip_name="opencv-python")
+        import cv2
+
+        image = cv2.imread(image_path, color_flag)
+        color_flag = color_flag or cv2.IMREAD_COLOR
+        if image is None:
+            raise ValueError(f"Could not read image from path: {image_path}")
+        return image
+
+    @staticmethod
+    def read_image_to_base64(
+        image_path: str,
+        color_flag: Optional[int] = None,
+    ) -> str:
+        image_path = str(image_path)
+        image = ImageUtil.read_image_to_array(image_path, color_flag)
+
+        file_extension = "." + image_path.split(".")[-1]
+        return ImageUtil.encode_image_to_base64(image, file_extension)
+
+    # @staticmethod
+    # def encode_image(image_path):
+    #     with open(image_path, "rb") as image_file:
+    #         return base64.b64encode(image_file.read()).decode("utf-8")
+
+    @staticmethod
+    def calculate_image_token_usage_from_base64(image_base64: str, detail):
+        """
+        Calculate the token usage for processing OpenAI images from a base64-encoded string.
+
+        Parameters:
+        image_base64 (str): The base64-encoded string of the image.
+        detail (str): The detail level of the image, either 'low' or 'high'.
+
+        Returns:
+        int: The total token cost for processing the image.
+        """
+        import base64
+        from io import BytesIO
+        from PIL import Image
+
+        # Decode the base64 string to get image data
+        if "data:image/jpeg;base64," in image_base64:
+            image_base64 = image_base64.split("data:image/jpeg;base64,")[1]
+        image_base64.strip("{}")
+
+        image_data = base64.b64decode(image_base64)
+        image = Image.open(BytesIO(image_data))
+
+        # Get image dimensions
+        width, height = image.size
+
+        if detail == "low":
+            return 85
+
+        # Scale to fit within a 2048 x 2048 square
+        max_dimension = 2048
+        if width > max_dimension or height > max_dimension:
+            scale_factor = max_dimension / max(width, height)
+            width = int(width * scale_factor)
+            height = int(height * scale_factor)
+
+        # Scale such that the shortest side is 768px
+        min_side = 768
+        if min(width, height) > min_side:
+            scale_factor = min_side / min(width, height)
+            width = int(width * scale_factor)
+            height = int(height * scale_factor)
+
+        # Calculate the number of 512px squares
+        num_squares = (width // 512) * (height // 512)
+        token_cost = 170 * num_squares + 85
+
+        return token_cost
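The sketch below is illustrative only and not part of the diff. It assumes lionagi 0.2.0 with opencv-python and Pillow installed, that the class imports as lionagi.libs.ln_image.ImageUtil, and a hypothetical local file photo.jpg.

from lionagi.libs.ln_image import ImageUtil

# read photo.jpg with cv2 and return it as a base64-encoded JPEG string
b64 = ImageUtil.read_image_to_base64("photo.jpg")

# estimate OpenAI vision token usage: flat 85 for detail="low",
# otherwise 170 per 512px tile plus a base 85 after rescaling
cost = ImageUtil.calculate_image_token_usage_from_base64(b64, detail="high")
print(cost)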
lionagi/libs/ln_nested.py
CHANGED
@@ -1,3 +1,19 @@
+"""
+Copyright 2024 HaiyangLi
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
 from collections import defaultdict
 from itertools import chain
 from typing import Any, Generator, Callable
@@ -52,7 +68,7 @@ def nset(nested_structure: dict | list, indices: list[int | str], value: Any) ->
 def nget(
     nested_structure: dict | list,
     indices: list[int | str],
-    default
+    default=...,
 ) -> Any:
     """
     retrieves a value from a nested list or dictionary structure, with an option to
@@ -98,12 +114,12 @@ def nget(
             return target_container[last_index]
         elif isinstance(target_container, dict) and last_index in target_container:
             return target_container[last_index]
-        elif default is not
+        elif default is not ...:
             return default
         else:
             raise LookupError("Target not found and no default value provided.")
     except (IndexError, KeyError, TypeError):
-        if default is not
+        if default is not ...:
             return default
         else:
             raise LookupError("Target not found and no default value provided.")
@@ -116,7 +132,7 @@ def nmerge(
     *,
     overwrite: bool = False,
     dict_sequence: bool = False,
-    sequence_separator: str = "_",
+    sequence_separator: str = "[^_^]",
     sort_list: bool = False,
     custom_sort: Callable[[Any], Any] | None = None,
 ) -> dict | list:
@@ -176,7 +192,7 @@ def flatten(
     /,
     *,
     parent_key: str = "",
-    sep: str = "_",
+    sep: str = "[^_^]",
     max_depth: int | None = None,
     inplace: bool = False,
     dict_only: bool = False,
@@ -238,7 +254,7 @@ def unflatten(
     flat_dict: dict[str, Any],
     /,
     *,
-    sep: str = "_",
+    sep: str = "[^_^]",
     custom_logic: Callable[[str], Any] | None = None,
     max_depth: int | None = None,
 ) -> dict | list:
@@ -330,7 +346,7 @@ def ninsert(
     indices: list[str | int],
     value: Any,
     *,
-    sep: str = "_",
+    sep: str = "[^_^]",
     max_depth: int | None = None,
     current_depth: int = 0,
 ) -> None:
@@ -393,12 +409,11 @@ def ninsert(
     nested_structure[last_part] = value
 
 
-# noinspection PyDecorator
 def get_flattened_keys(
     nested_structure: Any,
     /,
     *,
-    sep: str = "_",
+    sep: str = "[^_^]",
     max_depth: int | None = None,
     dict_only: bool = False,
     inplace: bool = False,
@@ -448,7 +463,7 @@ def _dynamic_flatten_in_place(
     /,
     *,
     parent_key: str = "",
-    sep: str = "_",
+    sep: str = "[^_^]",
     max_depth: int | None = None,
     current_depth: int = 0,
     dict_only: bool = False,
@@ -581,7 +596,7 @@ def _deep_update(original: dict, update: dict) -> dict:
 def _dynamic_flatten_generator(
     nested_structure: Any,
     parent_key: tuple[str, ...],
-    sep: str = "_",
+    sep: str = "[^_^]",
     max_depth: int | None = None,
     current_depth: int = 0,
     dict_only: bool = False,
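An illustrative sketch (not part of the diff) of the two behavioral changes above: nget's default is now an Ellipsis sentinel, so None becomes a usable default value, and the flatten/unflatten family switches its key separator from "_" to "[^_^]". The import path lionagi.libs.ln_nested is assumed from the file location.

from lionagi.libs.ln_nested import nget, flatten, unflatten

data = {"a": {"b": [10, 20]}}

nget(data, ["a", "b", 1])             # 20
nget(data, ["a", "x"], default=None)  # returns None instead of raising LookupError

# flattened keys are now joined with "[^_^]", e.g. "a[^_^]b[^_^]0", so dictionary
# keys that themselves contain "_" no longer collide with the separator
flat = flatten(data)
nested = unflatten(flat)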
lionagi/libs/ln_parse.py
CHANGED
@@ -1,9 +1,23 @@
+"""
+Copyright 2024 HaiyangLi
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
 from collections.abc import Callable
 import re
 import inspect
 import itertools
-import contextlib
-from functools import singledispatchmethod
 from typing import Any
 import numpy as np
 import lionagi.libs.ln_convert as convert
@@ -103,12 +117,12 @@ class ParseUtil:
     # inspired by langchain_core.output_parsers.json (MIT License)
     # https://github.com/langchain-ai/langchain/blob/master/libs/core/langchain_core/output_parsers/json.py
     @staticmethod
-    def
+    def extract_json_block(
         str_to_parse: str,
         language: str | None = None,
         regex_pattern: str | None = None,
         *,
-        parser: Callable[[str], Any],
+        parser: Callable[[str], Any] = None,
     ) -> Any:
         """
         Extracts and parses a code block from Markdown content.
@@ -148,9 +162,37 @@ class ParseUtil:
             raise ValueError(
                 f"No {language or 'specified'} code block found in the Markdown content."
             )
+        if not match:
+            str_to_parse = str_to_parse.strip()
+            if str_to_parse.startswith("```json\n") and str_to_parse.endswith("\n```"):
+                str_to_parse = str_to_parse[8:-4].strip()
 
+        parser = parser or ParseUtil.fuzzy_parse_json
         return parser(code_str)
 
+    @staticmethod
+    def extract_code_blocks(code):
+        code_blocks = []
+        lines = code.split("\n")
+        inside_code_block = False
+        current_block = []
+
+        for line in lines:
+            if line.startswith("```"):
+                if inside_code_block:
+                    code_blocks.append("\n".join(current_block))
+                    current_block = []
+                    inside_code_block = False
+                else:
+                    inside_code_block = True
+            elif inside_code_block:
+                current_block.append(line)
+
+        if current_block:
+            code_blocks.append("\n".join(current_block))
+
+        return "\n\n".join(code_blocks)
+
     @staticmethod
     def md_to_json(
         str_to_parse: str,
@@ -181,7 +223,7 @@ class ParseUtil:
         >>> md_to_json('```json\\n{"key": "value"}\\n```', expected_keys=['key'])
         {'key': 'value'}
         """
-        json_obj = ParseUtil.
+        json_obj = ParseUtil.extract_json_block(
             str_to_parse, language="json", parser=parser or ParseUtil.fuzzy_parse_json
         )
 
@@ -385,7 +427,9 @@ class ParseUtil:
         return type_mapping.get(py_type, "object")
 
     @staticmethod
-    def _func_to_schema(
+    def _func_to_schema(
+        func, style="google", func_description=None, params_description=None
+    ):
         """
         Generates a schema description for a given function, using typing hints and
         docstrings. The schema includes the function's name, description, and parameters.
@@ -412,9 +456,11 @@ class ParseUtil:
         """
         # Extracting function name and docstring details
        func_name = func.__name__
-
-
-
+
+        if not func_description:
+            func_description, _ = ParseUtil._extract_docstring_details(func, style)
+        if not params_description:
+            _, params_description = ParseUtil._extract_docstring_details(func, style)
 
         # Extracting parameters with typing hints
         sig = inspect.signature(func)
@@ -634,7 +680,7 @@ class StringMatch:
         # Calculate Jaro-Winkler similarity scores for each potential match
         scores = np.array(
             [
-                score_func(
+                score_func(str(word), str(correct_word))
                 for correct_word in correct_words_list
             ]
         )
@@ -648,26 +694,39 @@ class StringMatch:
 
         if isinstance(out_, str):
             # first try to parse it straight as a fuzzy json
+
             try:
                 out_ = ParseUtil.fuzzy_parse_json(out_)
-
+                return StringMatch.correct_dict_keys(keys, out_)
+
+            except:
                 try:
-                    # if failed we try to extract the json block and parse it
                     out_ = ParseUtil.md_to_json(out_)
+                    return StringMatch.correct_dict_keys(keys, out_)
+
                 except Exception:
-
-
-
-
-
-
-
+                    try:
+                        # if failed we try to extract the json block and parse it
+                        out_ = ParseUtil.md_to_json(out_)
+                        return StringMatch.correct_dict_keys(keys, out_)
+
+                    except Exception:
+                        # if still failed we try to extract the json block using re and parse it again
+                        match = re.search(r"```json\n({.*?})\n```", out_, re.DOTALL)
+                        if match:
+                            out_ = match.group(1)
                         try:
-                            out_ = ParseUtil.fuzzy_parse_json(
-
-
+                            out_ = ParseUtil.fuzzy_parse_json(out_)
+                            return StringMatch.correct_dict_keys(keys, out_)
+
                         except:
-
+                            try:
+                                out_ = ParseUtil.fuzzy_parse_json(
+                                    out_.replace("'", '"')
+                                )
+                                return StringMatch.correct_dict_keys(keys, out_)
+                            except:
+                                pass
 
         if isinstance(out_, dict):
             try:
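A hedged usage sketch for the ParseUtil additions above (not part of the diff), assuming the module imports as lionagi.libs.ln_parse: extract_code_blocks collects the bodies of all ``` fences, and md_to_json pulls the json block out of Markdown and parses it (the expected_keys argument comes from the docstring example shown in the diff).

from lionagi.libs.ln_parse import ParseUtil

md = "intro\n```python\nprint('hi')\n```\ntail\n```json\n{\"key\": \"value\"}\n```"

# joins the contents of every fenced block with a blank line:
# print('hi')
#
# {"key": "value"}
print(ParseUtil.extract_code_blocks(md))

# extracts the json block and parses it; fuzzy_parse_json is now the default parser
print(ParseUtil.md_to_json('```json\n{"key": "value"}\n```', expected_keys=["key"]))
# {'key': 'value'}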
lionagi/libs/ln_queue.py
CHANGED
@@ -1,3 +1,19 @@
+"""
+Copyright 2024 HaiyangLi
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
 """
 A class that manages asynchronous task processing with controlled concurrency.
 """
lionagi/libs/ln_tokenize.py
ADDED
@@ -0,0 +1,164 @@
+import tiktoken
+import math
+from .ln_convert import to_str
+from .special_tokens import disallowed_tokens
+
+
+class TokenizeUtil:
+
+    @staticmethod
+    def tokenize(
+        text,
+        encoding_model=None,
+        encoding_name=None,
+        return_byte=False,
+        disallowed_tokens=disallowed_tokens,
+    ):
+        encoding = None
+
+        if encoding_model:
+            try:
+                encoding_name = tiktoken.encoding_name_for_model(encoding_model)
+            except:
+                encoding_name = encoding_name or "cl100k_base"
+
+        if not encoding_name or encoding_name in tiktoken.list_encoding_names():
+            encoding_name = encoding_name or "cl100k_base"
+            encoding = tiktoken.get_encoding(encoding_name)
+
+        special_encodings = (
+            [encoding.encode(token) for token in disallowed_tokens]
+            if disallowed_tokens
+            else []
+        )
+        codes = encoding.encode(text)
+        if special_encodings and len(special_encodings) > 0:
+            codes = [code for code in codes if code not in special_encodings]
+
+        if return_byte:
+            return codes
+
+        return [encoding.decode([code]) for code in codes]
+
+    @staticmethod
+    def chunk_by_chars(
+        text: str, chunk_size: int, overlap: float, threshold: int
+    ) -> list[str | None]:
+        """
+        Chunks the input text into smaller parts, with optional overlap and threshold for final chunk.
+
+        Parameters:
+            text (str): The input text to chunk.
+
+            chunk_size (int): The size of each chunk.
+
+            overlap (float): The amount of overlap between chunks.
+
+            threshold (int): The minimum size of the final chunk.
+
+        Returns:
+            List[Union[str, None]]: A list of text chunks.
+
+        Raises:
+            ValueError: If an error occurs during chunking.
+        """
+
+        def _chunk_n1():
+            return [text]
+
+        def _chunk_n2():
+            chunks = []
+            chunks.append(text[: chunk_size + overlap_size])
+
+            if len(text) - chunk_size > threshold:
+                chunks.append(text[chunk_size - overlap_size :])
+            else:
+                return _chunk_n1()
+
+            return chunks
+
+        def _chunk_n3():
+            chunks = []
+            chunks.append(text[: chunk_size + overlap_size])
+            for i in range(1, n_chunks - 1):
+                start_idx = chunk_size * i - overlap_size
+                end_idx = chunk_size * (i + 1) + overlap_size
+                chunks.append(text[start_idx:end_idx])
+
+            if len(text) - chunk_size * (n_chunks - 1) > threshold:
+                chunks.append(text[chunk_size * (n_chunks - 1) - overlap_size :])
+            else:
+                chunks[-1] += text[chunk_size * (n_chunks - 1) + overlap_size :]
+
+            return chunks
+
+        try:
+            if not isinstance(text, str):
+                text = to_str(text)
+
+            n_chunks = math.ceil(len(text) / chunk_size)
+            overlap_size = int(overlap / 2)
+
+            if n_chunks == 1:
+                return _chunk_n1()
+
+            elif n_chunks == 2:
+                return _chunk_n2()
+
+            elif n_chunks > 2:
+                return _chunk_n3()
+
+        except Exception as e:
+            raise ValueError(f"An error occurred while chunking the text. {e}")
+
+    @staticmethod
+    def chunk_by_tokens(
+        text: str,
+        chunk_size: int,
+        overlap: float,
+        threshold: int,  # minimum size of the final chunk in number of tokens
+        encoding_model=None,
+        encoding_name=None,
+        return_tokens=False,
+        return_byte=False,
+    ) -> list[str | None]:
+
+        tokens = TokenizeUtil.tokenize(
+            text, encoding_model, encoding_name, return_byte=return_byte
+        )
+
+        n_chunks = math.ceil(len(tokens) / chunk_size)
+        overlap_size = int(overlap * chunk_size / 2)
+        residue = len(tokens) % chunk_size
+
+        if n_chunks == 1:
+            return text if not return_tokens else [tokens]
+
+        elif n_chunks == 2:
+            chunks = [tokens[: chunk_size + overlap_size]]
+            if residue > threshold:
+                chunks.append(tokens[chunk_size - overlap_size :])
+                return (
+                    [" ".join(chunk).strip() for chunk in chunks]
+                    if not return_tokens
+                    else chunks
+                )
+            else:
+                return text if not return_tokens else [tokens]
+
+        elif n_chunks > 2:
+            chunks = []
+            chunks.append(tokens[: chunk_size + overlap_size])
+            for i in range(1, n_chunks - 1):
+                start_idx = chunk_size * i - overlap_size
+                end_idx = chunk_size * (i + 1) + overlap_size
+                chunks.append(tokens[start_idx:end_idx])
+
+            if len(tokens) - chunk_size * (n_chunks - 1) > threshold:
+                chunks.append(tokens[chunk_size * (n_chunks - 1) - overlap_size :])
+            else:
+                chunks[-1] += tokens[-residue:]
+
+            return (
+                [" ".join(chunk) for chunk in chunks] if not return_tokens else chunks
+            )
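A usage sketch for the new TokenizeUtil (not part of the diff), assuming tiktoken is installed and the module imports as lionagi.libs.ln_tokenize. chunk_by_tokens tokenizes the text, then cuts it into chunk_size-token windows that share overlap * chunk_size / 2 tokens on each side; a trailing piece no longer than threshold is folded into the previous chunk. The sample text is arbitrary.

from lionagi.libs.ln_tokenize import TokenizeUtil

text = "lorem ipsum dolor sit amet " * 200

chunks = TokenizeUtil.chunk_by_tokens(
    text, chunk_size=256, overlap=0.1, threshold=32, encoding_name="cl100k_base"
)
print(len(chunks), chunks[0][:40])

# character-based variant: note that here overlap is an absolute character count,
# not a fraction of chunk_size
pieces = TokenizeUtil.chunk_by_chars(text, chunk_size=1000, overlap=100, threshold=200)
print(len(pieces))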
lionagi/libs/ln_validate.py
CHANGED
@@ -1,3 +1,19 @@
+"""
+Copyright 2024 HaiyangLi
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+
 """
 This module provides functions for validating and fixing field values based on their data types.