PyPI - lionagi - Versions diffs - 0.1.1__py3-none-any.whl → 0.2.0__py3-none-any.whl - Mend

lionagi 0.1.1__py3-none-any.whl → 0.2.0__py3-none-any.whl

Files changed (257) hide show

lionagi/__init__.py +60 -5
lionagi/core/__init__.py +0 -25
lionagi/core/_setting/_setting.py +59 -0
lionagi/core/action/__init__.py +14 -0
lionagi/core/action/function_calling.py +136 -0
lionagi/core/action/manual.py +1 -0
lionagi/core/action/node.py +109 -0
lionagi/core/action/tool.py +114 -0
lionagi/core/action/tool_manager.py +356 -0
lionagi/core/agent/base_agent.py +27 -13
lionagi/core/agent/eval/evaluator.py +1 -0
lionagi/core/agent/eval/vote.py +40 -0
lionagi/core/agent/learn/learner.py +59 -0
lionagi/core/agent/plan/unit_template.py +1 -0
lionagi/core/collections/__init__.py +17 -0
lionagi/core/{generic/data_logger.py → collections/_logger.py} +69 -55
lionagi/core/collections/abc/__init__.py +53 -0
lionagi/core/collections/abc/component.py +615 -0
lionagi/core/collections/abc/concepts.py +297 -0
lionagi/core/collections/abc/exceptions.py +150 -0
lionagi/core/collections/abc/util.py +45 -0
lionagi/core/collections/exchange.py +161 -0
lionagi/core/collections/flow.py +426 -0
lionagi/core/collections/model.py +419 -0
lionagi/core/collections/pile.py +913 -0
lionagi/core/collections/progression.py +236 -0
lionagi/core/collections/util.py +64 -0
lionagi/core/director/direct.py +314 -0
lionagi/core/director/director.py +2 -0
lionagi/core/{execute/branch_executor.py → engine/branch_engine.py} +134 -97
lionagi/core/{execute/instruction_map_executor.py → engine/instruction_map_engine.py} +80 -55
lionagi/{experimental/directive/evaluator → core/engine}/script_engine.py +17 -1
lionagi/core/executor/base_executor.py +90 -0
lionagi/core/{execute/structure_executor.py → executor/graph_executor.py} +83 -67
lionagi/core/{execute → executor}/neo4j_executor.py +70 -67
lionagi/core/generic/__init__.py +3 -33
lionagi/core/generic/edge.py +42 -92
lionagi/core/generic/edge_condition.py +16 -0
lionagi/core/generic/graph.py +236 -0
lionagi/core/generic/hyperedge.py +1 -0
lionagi/core/generic/node.py +156 -221
lionagi/core/generic/tree.py +48 -0
lionagi/core/generic/tree_node.py +79 -0
lionagi/core/mail/__init__.py +12 -0
lionagi/core/mail/mail.py +25 -0
lionagi/core/mail/mail_manager.py +139 -58
lionagi/core/mail/package.py +45 -0
lionagi/core/mail/start_mail.py +36 -0
lionagi/core/message/__init__.py +19 -0
lionagi/core/message/action_request.py +133 -0
lionagi/core/message/action_response.py +135 -0
lionagi/core/message/assistant_response.py +95 -0
lionagi/core/message/instruction.py +234 -0
lionagi/core/message/message.py +101 -0
lionagi/core/message/system.py +86 -0
lionagi/core/message/util.py +283 -0
lionagi/core/report/__init__.py +4 -0
lionagi/core/report/base.py +217 -0
lionagi/core/report/form.py +231 -0
lionagi/core/report/report.py +166 -0
lionagi/core/report/util.py +28 -0
lionagi/core/rule/_default.py +16 -0
lionagi/core/rule/action.py +99 -0
lionagi/core/rule/base.py +238 -0
lionagi/core/rule/boolean.py +56 -0
lionagi/core/rule/choice.py +47 -0
lionagi/core/rule/mapping.py +96 -0
lionagi/core/rule/number.py +71 -0
lionagi/core/rule/rulebook.py +109 -0
lionagi/core/rule/string.py +52 -0
lionagi/core/rule/util.py +35 -0
lionagi/core/session/branch.py +431 -0
lionagi/core/session/directive_mixin.py +287 -0
lionagi/core/session/session.py +229 -903
lionagi/core/structure/__init__.py +1 -0
lionagi/core/structure/chain.py +1 -0
lionagi/core/structure/forest.py +1 -0
lionagi/core/structure/graph.py +1 -0
lionagi/core/structure/tree.py +1 -0
lionagi/core/unit/__init__.py +5 -0
lionagi/core/unit/parallel_unit.py +245 -0
lionagi/core/unit/template/action.py +81 -0
lionagi/core/unit/template/base.py +51 -0
lionagi/core/unit/template/plan.py +84 -0
lionagi/core/unit/template/predict.py +109 -0
lionagi/core/unit/template/score.py +124 -0
lionagi/core/unit/template/select.py +104 -0
lionagi/core/unit/unit.py +362 -0
lionagi/core/unit/unit_form.py +305 -0
lionagi/core/unit/unit_mixin.py +1168 -0
lionagi/core/unit/util.py +71 -0
lionagi/core/validator/validator.py +364 -0
lionagi/core/work/work.py +74 -0
lionagi/core/work/work_function.py +92 -0
lionagi/core/work/work_queue.py +81 -0
lionagi/core/work/worker.py +195 -0
lionagi/core/work/worklog.py +124 -0
lionagi/experimental/compressor/base.py +46 -0
lionagi/experimental/compressor/llm_compressor.py +247 -0
lionagi/experimental/compressor/llm_summarizer.py +61 -0
lionagi/experimental/compressor/util.py +70 -0
lionagi/experimental/directive/__init__.py +19 -0
lionagi/experimental/directive/parser/base_parser.py +69 -2
lionagi/experimental/directive/{template_ → template}/base_template.py +17 -1
lionagi/{libs/ln_tokenizer.py → experimental/directive/tokenizer.py} +16 -0
lionagi/experimental/{directive/evaluator → evaluator}/ast_evaluator.py +16 -0
lionagi/experimental/{directive/evaluator → evaluator}/base_evaluator.py +16 -0
lionagi/experimental/knowledge/__init__.py +0 -0
lionagi/experimental/knowledge/base.py +10 -0
lionagi/experimental/knowledge/graph.py +0 -0
lionagi/experimental/memory/__init__.py +0 -0
lionagi/experimental/strategies/__init__.py +0 -0
lionagi/experimental/strategies/base.py +1 -0
lionagi/integrations/bridge/langchain_/documents.py +4 -0
lionagi/integrations/bridge/llamaindex_/index.py +30 -0
lionagi/integrations/bridge/llamaindex_/llama_index_bridge.py +6 -0
lionagi/integrations/chunker/chunk.py +161 -24
lionagi/integrations/config/oai_configs.py +34 -3
lionagi/integrations/config/openrouter_configs.py +14 -2
lionagi/integrations/loader/load.py +122 -21
lionagi/integrations/loader/load_util.py +6 -77
lionagi/integrations/provider/_mapping.py +46 -0
lionagi/integrations/provider/litellm.py +2 -1
lionagi/integrations/provider/mlx_service.py +16 -9
lionagi/integrations/provider/oai.py +91 -4
lionagi/integrations/provider/ollama.py +6 -5
lionagi/integrations/provider/openrouter.py +115 -8
lionagi/integrations/provider/services.py +2 -2
lionagi/integrations/provider/transformers.py +18 -22
lionagi/integrations/storage/__init__.py +3 -3
lionagi/integrations/storage/neo4j.py +52 -60
lionagi/integrations/storage/storage_util.py +45 -47
lionagi/integrations/storage/structure_excel.py +285 -0
lionagi/integrations/storage/to_excel.py +23 -7
lionagi/libs/__init__.py +26 -1
lionagi/libs/ln_api.py +75 -20
lionagi/libs/ln_context.py +37 -0
lionagi/libs/ln_convert.py +21 -9
lionagi/libs/ln_func_call.py +69 -28
lionagi/libs/ln_image.py +107 -0
lionagi/libs/ln_nested.py +26 -11
lionagi/libs/ln_parse.py +82 -23
lionagi/libs/ln_queue.py +16 -0
lionagi/libs/ln_tokenize.py +164 -0
lionagi/libs/ln_validate.py +16 -0
lionagi/libs/special_tokens.py +172 -0
lionagi/libs/sys_util.py +95 -24
lionagi/lions/coder/code_form.py +13 -0
lionagi/lions/coder/coder.py +50 -3
lionagi/lions/coder/util.py +30 -25
lionagi/tests/libs/test_func_call.py +23 -21
lionagi/tests/libs/test_nested.py +36 -21
lionagi/tests/libs/test_parse.py +1 -1
lionagi/tests/test_core/collections/__init__.py +0 -0
lionagi/tests/test_core/collections/test_component.py +206 -0
lionagi/tests/test_core/collections/test_exchange.py +138 -0
lionagi/tests/test_core/collections/test_flow.py +145 -0
lionagi/tests/test_core/collections/test_pile.py +171 -0
lionagi/tests/test_core/collections/test_progression.py +129 -0
lionagi/tests/test_core/generic/__init__.py +0 -0
lionagi/tests/test_core/generic/test_edge.py +67 -0
lionagi/tests/test_core/generic/test_graph.py +96 -0
lionagi/tests/test_core/generic/test_node.py +106 -0
lionagi/tests/test_core/generic/test_tree_node.py +73 -0
lionagi/tests/test_core/test_branch.py +115 -294
lionagi/tests/test_core/test_form.py +46 -0
lionagi/tests/test_core/test_report.py +105 -0
lionagi/tests/test_core/test_validator.py +111 -0
lionagi/version.py +1 -1
lionagi-0.2.0.dist-info/LICENSE +202 -0
lionagi-0.2.0.dist-info/METADATA +272 -0
lionagi-0.2.0.dist-info/RECORD +240 -0
lionagi/core/branch/base.py +0 -653
lionagi/core/branch/branch.py +0 -474
lionagi/core/branch/flow_mixin.py +0 -96
lionagi/core/branch/util.py +0 -323
lionagi/core/direct/__init__.py +0 -19
lionagi/core/direct/cot.py +0 -123
lionagi/core/direct/plan.py +0 -164
lionagi/core/direct/predict.py +0 -166
lionagi/core/direct/react.py +0 -171
lionagi/core/direct/score.py +0 -279
lionagi/core/direct/select.py +0 -170
lionagi/core/direct/sentiment.py +0 -1
lionagi/core/direct/utils.py +0 -110
lionagi/core/direct/vote.py +0 -64
lionagi/core/execute/base_executor.py +0 -47
lionagi/core/flow/baseflow.py +0 -23
lionagi/core/flow/monoflow/ReAct.py +0 -238
lionagi/core/flow/monoflow/__init__.py +0 -9
lionagi/core/flow/monoflow/chat.py +0 -95
lionagi/core/flow/monoflow/chat_mixin.py +0 -253
lionagi/core/flow/monoflow/followup.py +0 -213
lionagi/core/flow/polyflow/__init__.py +0 -1
lionagi/core/flow/polyflow/chat.py +0 -251
lionagi/core/form/action_form.py +0 -26
lionagi/core/form/field_validator.py +0 -287
lionagi/core/form/form.py +0 -302
lionagi/core/form/mixin.py +0 -214
lionagi/core/form/scored_form.py +0 -13
lionagi/core/generic/action.py +0 -26
lionagi/core/generic/component.py +0 -455
lionagi/core/generic/condition.py +0 -44
lionagi/core/generic/mail.py +0 -90
lionagi/core/generic/mailbox.py +0 -36
lionagi/core/generic/relation.py +0 -70
lionagi/core/generic/signal.py +0 -22
lionagi/core/generic/structure.py +0 -362
lionagi/core/generic/transfer.py +0 -20
lionagi/core/generic/work.py +0 -40
lionagi/core/graph/graph.py +0 -126
lionagi/core/graph/tree.py +0 -190
lionagi/core/mail/schema.py +0 -63
lionagi/core/messages/schema.py +0 -325
lionagi/core/tool/__init__.py +0 -5
lionagi/core/tool/tool.py +0 -28
lionagi/core/tool/tool_manager.py +0 -282
lionagi/experimental/tool/function_calling.py +0 -43
lionagi/experimental/tool/manual.py +0 -66
lionagi/experimental/tool/schema.py +0 -59
lionagi/experimental/tool/tool_manager.py +0 -138
lionagi/experimental/tool/util.py +0 -16
lionagi/experimental/work/_logger.py +0 -25
lionagi/experimental/work/schema.py +0 -30
lionagi/experimental/work/tests.py +0 -72
lionagi/experimental/work/work_function.py +0 -89
lionagi/experimental/work/worker.py +0 -12
lionagi/integrations/bridge/llamaindex_/get_index.py +0 -294
lionagi/tests/test_core/test_base_branch.py +0 -426
lionagi/tests/test_core/test_chat_flow.py +0 -63
lionagi/tests/test_core/test_mail_manager.py +0 -75
lionagi/tests/test_core/test_prompts.py +0 -51
lionagi/tests/test_core/test_session.py +0 -254
lionagi/tests/test_core/test_session_base_util.py +0 -313
lionagi/tests/test_core/test_tool_manager.py +0 -95
lionagi-0.1.1.dist-info/LICENSE +0 -9
lionagi-0.1.1.dist-info/METADATA +0 -174
lionagi-0.1.1.dist-info/RECORD +0 -190
/lionagi/core/{branch → _setting}/__init__.py +0 -0
/lionagi/core/{execute → agent/eval}/__init__.py +0 -0
/lionagi/core/{flow → agent/learn}/__init__.py +0 -0
/lionagi/core/{form → agent/plan}/__init__.py +0 -0
/lionagi/core/{branch/executable_branch.py → agent/plan/plan.py} +0 -0
/lionagi/core/{graph → director}/__init__.py +0 -0
/lionagi/core/{messages → engine}/__init__.py +0 -0
/lionagi/{experimental/directive/evaluator → core/engine}/sandbox_.py +0 -0
/lionagi/{experimental/directive/evaluator → core/executor}/__init__.py +0 -0
/lionagi/{experimental/directive/template_ → core/rule}/__init__.py +0 -0
/lionagi/{experimental/tool → core/unit/template}/__init__.py +0 -0
/lionagi/{experimental/work → core/validator}/__init__.py +0 -0
/lionagi/core/{flow/mono_chat_mixin.py → work/__init__.py} +0 -0
/lionagi/experimental/{work/exchange.py → compressor/__init__.py} +0 -0
/lionagi/experimental/{work/util.py → directive/template/__init__.py} +0 -0
/lionagi/experimental/directive/{schema.py → template/schema.py} +0 -0
/lionagi/{tests/libs/test_async.py → experimental/evaluator/__init__.py} +0 -0
{lionagi-0.1.1.dist-info → lionagi-0.2.0.dist-info}/WHEEL +0 -0
{lionagi-0.1.1.dist-info → lionagi-0.2.0.dist-info}/top_level.txt +0 -0

lionagi/integrations/chunker/chunk.py CHANGED Viewed

@@ -1,6 +1,8 @@
 from typing import Union, Callable
 from lionagi.libs import func_call
+from lionagi.libs.ln_convert import to_list
+from lionagi.core.collections import pile
 from lionagi.core.generic import Node
 from ..bridge.langchain_.langchain_bridge import LangchainBridge
 from ..bridge.llamaindex_.llama_index_bridge import LlamaIndexBridge
@@ -10,7 +12,20 @@ from ..loader.load_util import ChunkerType, file_to_chunks, _datanode_parser
 def datanodes_convert(documents, chunker_type):
+    """
+    Converts documents to the specified chunker type.
+    Args:
+        documents (list): List of documents to be converted.
+        chunker_type (ChunkerType): The type of chunker to convert the documents to.
+    Returns:
+        list: The converted documents.
+    Example usage:
+        >>> documents = [Node(...), Node(...)]
+        >>> converted_docs = datanodes_convert(documents, ChunkerType.LLAMAINDEX)
+    """
     for i in range(len(documents)):
         if type(documents[i]) == Node:
             if chunker_type == ChunkerType.LLAMAINDEX:
@@ -21,25 +36,71 @@ def datanodes_convert(documents, chunker_type):
 def text_chunker(documents, args, kwargs):
+    """
+    Chunks text documents into smaller pieces.
+    Args:
+        documents (list): List of documents to be chunked.
+        args (tuple): Positional arguments for the chunking function.
+        kwargs (dict): Keyword arguments for the chunking function.
+    Returns:
+        pile: A pile of chunked Node instances.
+    Example usage:
+        >>> documents = [Node(...), Node(...)]
+        >>> chunked_docs = text_chunker(documents, args, kwargs)
+    """
     def chunk_node(node):
         chunks = file_to_chunks(node.to_dict(), *args, **kwargs)
-        func_call.lcall(chunks, lambda chunk: chunk.pop("node_id"))
+        func_call.lcall(chunks, lambda chunk: chunk.pop("ln_id"))
         return [Node.from_obj({**chunk}) for chunk in chunks]
-    return [chunk_node(doc) for doc in documents]
+    a = to_list([chunk_node(doc) for doc in documents], flatten=True, dropna=True)
+    return pile(a)
 def chunk(
-    documents,
-    chunker,
+    docs,
+    field: str = "content",
+    chunk_size: int = 1500,
+    overlap: float = 0.1,
+    threshold: int = 200,
+    chunker="text_chunker",
     chunker_type=ChunkerType.PLAIN,
     chunker_args=None,
     chunker_kwargs=None,
     chunking_kwargs=None,
     documents_convert_func=None,
-    to_datanode: bool | Callable = True,
+    to_lion: bool | Callable = True,
 ):
+    """
+    Chunks documents using the specified chunker.
+    Args:
+        docs (list): List of documents to be chunked.
+        field (str, optional): The field to chunk. Defaults to "content".
+        chunk_size (int, optional): The size of each chunk. Defaults to 1500.
+        overlap (float, optional): The overlap between chunks. Defaults to 0.1.
+        threshold (int, optional): The threshold for chunking. Defaults to 200.
+        chunker (str, optional): The chunker function or its name. Defaults to "text_chunker".
+        chunker_type (ChunkerType, optional): The type of chunker to use. Defaults to ChunkerType.PLAIN.
+        chunker_args (list, optional): Positional arguments for the chunker function. Defaults to None.
+        chunker_kwargs (dict, optional): Keyword arguments for the chunker function. Defaults to None.
+        chunking_kwargs (dict, optional): Additional keyword arguments for chunking. Defaults to None.
+        documents_convert_func (Callable, optional): Function to convert documents. Defaults to None.
+        to_lion (bool | Callable, optional): Whether to convert the data to Node instances or a custom parser. Defaults to True.
+    Returns:
+        pile: A pile of chunked Node instances.
+    Raises:
+        ValueError: If the chunker_type is not supported.
+    Example usage:
+        >>> chunked_docs = chunk(docs, field='text', chunk_size=1000, overlap=0.2)
+    """
     if chunker_args is None:
         chunker_args = []
@@ -49,38 +110,42 @@ def chunk(
         chunking_kwargs = {}
     if chunker_type == ChunkerType.PLAIN:
+        chunker_kwargs["field"] = field
+        chunker_kwargs["chunk_size"] = chunk_size
+        chunker_kwargs["overlap"] = overlap
+        chunker_kwargs["threshold"] = threshold
         return chunk_funcs[ChunkerType.PLAIN](
-            documents, chunker, chunker_args, chunker_kwargs
+            docs, chunker, chunker_args, chunker_kwargs
         )
     elif chunker_type == ChunkerType.LANGCHAIN:
         return chunk_funcs[ChunkerType.LANGCHAIN](
-            documents,
+            docs,
             documents_convert_func,
             chunker,
             chunker_args,
             chunker_kwargs,
-            to_datanode,
+            to_lion,
         )
     elif chunker_type == ChunkerType.LLAMAINDEX:
         return chunk_funcs[ChunkerType.LLAMAINDEX](
-            documents,
+            docs,
             documents_convert_func,
             chunker,
             chunker_args,
             chunker_kwargs,
-            to_datanode,
+            to_lion,
         )
     elif chunker_type == ChunkerType.SELFDEFINED:
         return chunk_funcs[ChunkerType.SELFDEFINED](
-            documents,
+            docs,
             chunker,
             chunker_args,
             chunker_kwargs,
             chunking_kwargs,
-            to_datanode,
+            to_lion,
         )
     else:
@@ -95,8 +160,28 @@ def _self_defined_chunker(
     chunker_args,
     chunker_kwargs,
     chunking_kwargs,
-    to_datanode: bool | Callable,
+    to_lion: bool | Callable,
 ):
+    """
+    Chunks documents using a self-defined chunker.
+    Args:
+        documents (list): List of documents to be chunked.
+        chunker (str | Callable): The chunker function or its name.
+        chunker_args (list): Positional arguments for the chunker function.
+        chunker_kwargs (dict): Keyword arguments for the chunker function.
+        chunking_kwargs (dict): Additional keyword arguments for chunking.
+        to_lion (bool | Callable): Whether to convert the data to Node instances or a custom parser.
+    Returns:
+        pile: A pile of chunked Node instances or custom parsed nodes.
+    Raises:
+        ValueError: If the self-defined chunker is not valid.
+    Example usage:
+        >>> chunked_docs = _self_defined_chunker(docs, custom_chunker, ['arg1'], {'key': 'value'}, {}, custom_parser)
+    """
     try:
         splitter = chunker(*chunker_args, **chunker_kwargs)
         nodes = splitter.split(documents, **chunking_kwargs)
@@ -105,10 +190,10 @@ def _self_defined_chunker(
             f"Self defined chunker {chunker} is not valid. Error: {e}"
         ) from e
-    if isinstance(to_datanode, bool) and to_datanode is True:
+    if isinstance(to_lion, bool) and to_lion is True:
         raise ValueError("Please define a valid parser to Node.")
-    elif isinstance(to_datanode, Callable):
-        nodes = _datanode_parser(nodes, to_datanode)
+    elif isinstance(to_lion, Callable):
+        nodes = _datanode_parser(nodes, to_lion)
     return nodes
@@ -118,18 +203,35 @@ def _llama_index_chunker(
     chunker,
     chunker_args,
     chunker_kwargs,
-    to_datanode: bool | Callable,
+    to_lion: bool | Callable,
 ):
+    """
+    Chunks documents using a LlamaIndex chunker.
+    Args:
+        documents (list): List of documents to be chunked.
+        documents_convert_func (Callable): Function to convert documents.
+        chunker (str | Callable): The chunker function or its name.
+        chunker_args (list): Positional arguments for the chunker function.
+        chunker_kwargs (dict): Keyword arguments for the chunker function.
+        to_lion (bool | Callable): Whether to convert the data to Node instances or a custom parser.
+    Returns:
+        pile: A pile of chunked Node instances or custom parsed nodes.
+    Example usage:
+        >>> chunked_docs = _llama_index_chunker(docs, convert_func, llama_chunker, ['arg1'], {'key': 'value'}, True)
+    """
     if documents_convert_func:
         documents = documents_convert_func(documents, "llama_index")
     nodes = LlamaIndexBridge.llama_index_parse_node(
         documents, chunker, chunker_args, chunker_kwargs
     )
-    if isinstance(to_datanode, bool) and to_datanode is True:
+    if isinstance(to_lion, bool) and to_lion is True:
         nodes = [Node.from_llama_index(i) for i in nodes]
-    elif isinstance(to_datanode, Callable):
-        nodes = _datanode_parser(nodes, to_datanode)
+    elif isinstance(to_lion, Callable):
+        nodes = _datanode_parser(nodes, to_lion)
     return nodes
@@ -139,24 +241,59 @@ def _langchain_chunker(
     chunker,
     chunker_args,
     chunker_kwargs,
-    to_datanode: bool | Callable,
+    to_lion: bool | Callable,
 ):
+    """
+    Chunks documents using a Langchain chunker.
+    Args:
+        documents (list): List of documents to be chunked.
+        documents_convert_func (Callable): Function to convert documents.
+        chunker (str | Callable): The chunker function or its name.
+        chunker_args (list): Positional arguments for the chunker function.
+        chunker_kwargs (dict): Keyword arguments for the chunker function.
+        to_lion (bool | Callable): Whether to convert the data to Node instances or a custom parser.
+    Returns:
+        pile: A pile of chunked Node instances or custom parsed nodes.
+    Example usage:
+        >>> chunked_docs = _langchain_chunker(docs, convert_func, langchain_chunker, ['arg1'], {'key': 'value'}, True)
+    """
     if documents_convert_func:
         documents = documents_convert_func(documents, "langchain")
     nodes = LangchainBridge.langchain_text_splitter(
         documents, chunker, chunker_args, chunker_kwargs
     )
-    if isinstance(to_datanode, bool) and to_datanode is True:
+    if isinstance(to_lion, bool) and to_lion is True:
         if isinstance(documents, str):
             nodes = [Node(content=i) for i in nodes]
         else:
             nodes = [Node.from_langchain(i) for i in nodes]
-    elif isinstance(to_datanode, Callable):
-        nodes = _datanode_parser(nodes, to_datanode)
+    elif isinstance(to_lion, Callable):
+        nodes = _datanode_parser(nodes, to_lion)
     return nodes
 def _plain_chunker(documents, chunker, chunker_args, chunker_kwargs):
+    """
+    Chunks documents using a plain chunker.
+    Args:
+        documents (list): List of documents to be chunked.
+        chunker (str | Callable): The chunker function or its name.
+        chunker_args (list): Positional arguments for the chunker function.
+        chunker_kwargs (dict): Keyword arguments for the chunker function.
+    Returns:
+        pile: A pile of chunked Node instances.
+    Raises:
+        ValueError: If the chunker is not supported.
+    Example usage:
+        >>> chunked_docs = _plain_chunker(docs, 'text_chunker', ['arg1'], {'key': 'value'})
+    """
     try:
         if chunker == "text_chunker":
             chunker = text_chunker

lionagi/integrations/config/oai_configs.py CHANGED Viewed

@@ -1,8 +1,10 @@
 # Default configs for the OpenAI API
+API_key_schema = ("OPENAI_API_KEY",)
 # ChatCompletion
 oai_chat_llmconfig = {
-    "model": "gpt-4-turbo",
+    "model": "gpt-4o",
     "frequency_penalty": 0,
     "max_tokens": None,
     "n": 1,
@@ -11,11 +13,13 @@ oai_chat_llmconfig = {
     "seed": None,
     "stop": None,
     "stream": False,
-    "temperature": 0.7,
+    "temperature": 0.1,
     "top_p": 1,
     "tools": None,
     "tool_choice": "none",
     "user": None,
+    "logprobs": False,
+    "top_logprobs": None,
 }
 oai_chat_schema = {
@@ -36,9 +40,16 @@ oai_chat_schema = {
         "tool_choice",
         "user",
         "max_tokens",
+        "logprobs",
+        "top_logprobs",
     ],
     "input_": "messages",
     "config": oai_chat_llmconfig,
+    "token_encoding_name": "cl100k_base",
+    "token_limit": 128_000,
+    "interval_tokens": 1_000_000,
+    "interval_requests": 1_000,
+    "interval": 60,
 }
 # Finetune
@@ -111,8 +122,26 @@ oai_audio_translations_schema = {
     "config": oai_audio_translations_llmconfig,
 }
-# images
+# embeddings
+oai_embeddings_llmconfig = {
+    "model": "text-embedding-ada-002",
+    "encoding_format": "float",
+    "user": None,
+    "dimensions": None,
+}
+oai_embeddings_schema = {
+    "required": ["model", "encoding_format"],
+    "optional": ["user", "dimensions"],
+    "input_": "input",
+    "config": oai_embeddings_llmconfig,
+    "token_encoding_name": "cl100k_base",
+    "token_limit": 8192,
+    "interval_tokens": 1_000_000,
+    "interval_requests": 1_000,
+    "interval": 60,
+}
 oai_schema = {
     "chat/completions": oai_chat_schema,
@@ -120,4 +149,6 @@ oai_schema = {
     "audio_speech": oai_audio_speech_schema,
     "audio_transcriptions": oai_audio_transcriptions_schema,
     "audio_translations": oai_audio_translations_schema,
+    "API_key_schema": API_key_schema,
+    "embeddings": oai_embeddings_schema,
 }

lionagi/integrations/config/openrouter_configs.py CHANGED Viewed

@@ -1,5 +1,7 @@
+API_key_schema = ("OPENROUTER_API_KEY",)
 openrouter_chat_llmconfig = {
-    "model": "gpt-4-turbo",
+    "model": "gpt-4o",
     "frequency_penalty": 0,
     "max_tokens": None,
     "num": 1,
@@ -8,11 +10,13 @@ openrouter_chat_llmconfig = {
     "seed": None,
     "stop": None,
     "stream": False,
-    "temperature": 0.7,
+    "temperature": 0.1,
     "top_p": 1,
     "tools": None,
     "tool_choice": "none",
     "user": None,
+    "logprobs": False,
+    "top_logprobs": None,
 }
 openrouter_chat_schema = {
@@ -33,9 +37,16 @@ openrouter_chat_schema = {
         "tool_choice",
         "user",
         "max_tokens",
+        "logprobs",
+        "top_logprobs",
     ],
     "input_": "messages",
     "config": openrouter_chat_llmconfig,
+    "token_encoding_name": "cl100k_base",
+    "token_limit": 128_000,
+    "interval_tokens": 10_000,
+    "interval_requests": 100,
+    "interval": 60,
 }
 openrouter_finetune_llmconfig = {
@@ -59,4 +70,5 @@ openrouter_finetune_schema = {
 openrouter_schema = {
     "chat/completions": openrouter_chat_schema,
     "finetune": openrouter_finetune_schema,
+    "API_key_schema": API_key_schema,
 }

lionagi/integrations/loader/load.py CHANGED Viewed

@@ -1,6 +1,7 @@
 from typing import Callable
 from lionagi.core.generic import Node
+from lionagi.core.collections import pile
 from ..bridge.langchain_.langchain_bridge import LangchainBridge
 from ..bridge.llamaindex_.llama_index_bridge import LlamaIndexBridge
@@ -27,18 +28,43 @@ def text_reader(args, kwargs):
 def load(
-    reader: str | Callable = "SimpleDirectoryReader",
+    reader: str | Callable = "text_reader",
     input_dir=None,
     input_files=None,
     recursive: bool = False,
     required_exts: list[str] = None,
-    reader_type=ReaderType.LLAMAINDEX,
+    reader_type=ReaderType.PLAIN,
     reader_args=None,
     reader_kwargs=None,
     load_args=None,
     load_kwargs=None,
-    to_datanode: bool | Callable = True,
+    to_lion: bool | Callable = True,
 ):
+    """
+    Loads data using the specified reader and converts it to Node instances.
+    Args:
+        reader (str | Callable): The reader function or its name. Defaults to "text_reader".
+        input_dir (str, optional): The directory to read files from. Defaults to None.
+        input_files (list[str], optional): Specific files to read. Defaults to None.
+        recursive (bool, optional): Whether to read files recursively. Defaults to False.
+        required_exts (list[str], optional): List of required file extensions. Defaults to None.
+        reader_type (ReaderType, optional): The type of reader to use. Defaults to ReaderType.PLAIN.
+        reader_args (list, optional): Positional arguments for the reader function. Defaults to None.
+        reader_kwargs (dict, optional): Keyword arguments for the reader function. Defaults to None.
+        load_args (list, optional): Positional arguments for loading. Defaults to None.
+        load_kwargs (dict, optional): Keyword arguments for loading. Defaults to None.
+        to_lion (bool | Callable, optional): Whether to convert the data to Node instances or a custom parser. Defaults to True.
+    Returns:
+        pile: A pile of Node instances.
+    Raises:
+        ValueError: If the reader_type is not supported.
+    Example usage:
+        >>> nodes = load(input_dir='path/to/text/files', required_exts=['txt'])
+    """
     if reader_args is None:
         reader_args = []
@@ -50,11 +76,15 @@ def load(
         load_kwargs = {}
     if reader_type == ReaderType.PLAIN:
+        reader_kwargs["dir_"] = input_dir
+        reader_kwargs["ext"] = required_exts
+        reader_kwargs["recursive"] = recursive
         return read_funcs[ReaderType.PLAIN](reader, reader_args, reader_kwargs)
     if reader_type == ReaderType.LANGCHAIN:
         return read_funcs[ReaderType.LANGCHAIN](
-            reader, reader_args, reader_kwargs, to_datanode
+            reader, reader_args, reader_kwargs, to_lion
         )
     elif reader_type == ReaderType.LLAMAINDEX:
@@ -68,12 +98,12 @@ def load(
             reader_kwargs["required_exts"] = required_exts
         return read_funcs[ReaderType.LLAMAINDEX](
-            reader, reader_args, reader_kwargs, load_args, load_kwargs, to_datanode
+            reader, reader_args, reader_kwargs, load_args, load_kwargs, to_lion
         )
     elif reader_type == ReaderType.SELFDEFINED:
         return read_funcs[ReaderType.SELFDEFINED](
-            reader, reader_args, reader_kwargs, load_args, load_kwargs, to_datanode
+            reader, reader_args, reader_kwargs, load_args, load_kwargs, to_lion
         )
     else:
@@ -83,23 +113,56 @@ def load(
 def _plain_reader(reader, reader_args, reader_kwargs):
+    """
+    Reads data using a plain reader.
+    Args:
+        reader (str | Callable): The reader function or its name.
+        reader_args (list): Positional arguments for the reader function.
+        reader_kwargs (dict): Keyword arguments for the reader function.
+    Returns:
+        pile: A pile of Node instances.
+    Raises:
+        ValueError: If the reader is not supported.
+    Example usage:
+        >>> nodes = _plain_reader('text_reader', ['path/to/files'], {'ext': 'txt'})
+    """
     try:
         if reader == "text_reader":
             reader = text_reader
-        return reader(reader_args, reader_kwargs)
+        nodes = reader(reader_args, reader_kwargs)
+        return pile(nodes)
     except Exception as e:
         raise ValueError(
             f"Reader {reader} is currently not supported. Error: {e}"
         ) from e
-def _langchain_reader(reader, reader_args, reader_kwargs, to_datanode: bool | Callable):
+def _langchain_reader(reader, reader_args, reader_kwargs, to_lion: bool | Callable):
+    """
+    Reads data using a Langchain reader.
+    Args:
+        reader (str | Callable): The reader function or its name.
+        reader_args (list): Positional arguments for the reader function.
+        reader_kwargs (dict): Keyword arguments for the reader function.
+        to_lion (bool | Callable): Whether to convert the data to Node instances or a custom parser.
+    Returns:
+        pile: A pile of Node instances or custom parsed nodes.
+    Example usage:
+        >>> nodes = _langchain_reader('langchain_reader', ['arg1'], {'key': 'value'}, True)
+    """
     nodes = LangchainBridge.langchain_loader(reader, reader_args, reader_kwargs)
-    if isinstance(to_datanode, bool) and to_datanode is True:
-        nodes = [Node.from_langchain(i) for i in nodes]
+    if isinstance(to_lion, bool) and to_lion is True:
+        return pile([Node.from_langchain(i) for i in nodes])
-    elif isinstance(to_datanode, Callable):
-        nodes = _datanode_parser(nodes, to_datanode)
+    elif isinstance(to_lion, Callable):
+        nodes = _datanode_parser(nodes, to_lion)
     return nodes
@@ -109,15 +172,33 @@ def _llama_index_reader(
     reader_kwargs,
     load_args,
     load_kwargs,
-    to_datanode: bool | Callable,
+    to_lion: bool | Callable,
 ):
+    """
+    Reads data using a LlamaIndex reader.
+    Args:
+        reader (str | Callable): The reader function or its name.
+        reader_args (list): Positional arguments for the reader function.
+        reader_kwargs (dict): Keyword arguments for the reader function.
+        load_args (list): Positional arguments for loading.
+        load_kwargs (dict): Keyword arguments for loading.
+        to_lion (bool | Callable): Whether to convert the data to Node instances or a custom parser.
+    Returns:
+        pile: A pile of Node instances or custom parsed nodes.
+    Example usage:
+        >>> nodes = _llama_index_reader('llama_reader', ['arg1'], {'key': 'value'}, [], {}, True)
+    """
     nodes = LlamaIndexBridge.llama_index_read_data(
         reader, reader_args, reader_kwargs, load_args, load_kwargs
     )
-    if isinstance(to_datanode, bool) and to_datanode is True:
-        nodes = [Node.from_llama_index(i) for i in nodes]
-    elif isinstance(to_datanode, Callable):
-        nodes = _datanode_parser(nodes, to_datanode)
+    if isinstance(to_lion, bool) and to_lion is True:
+        return pile([Node.from_llama_index(i) for i in nodes])
+    elif isinstance(to_lion, Callable):
+        nodes = _datanode_parser(nodes, to_lion)
     return nodes
@@ -127,8 +208,28 @@ def _self_defined_reader(
     reader_kwargs,
     load_args,
     load_kwargs,
-    to_datanode: bool | Callable,
+    to_lion: bool | Callable,
 ):
+    """
+    Reads data using a self-defined reader.
+    Args:
+        reader (str | Callable): The reader function or its name.
+        reader_args (list): Positional arguments for the reader function.
+        reader_kwargs (dict): Keyword arguments for the reader function.
+        load_args (list): Positional arguments for loading.
+        load_kwargs (dict): Keyword arguments for loading.
+        to_lion (bool | Callable): Whether to convert the data to Node instances or a custom parser.
+    Returns:
+        pile: A pile of Node instances or custom parsed nodes.
+    Raises:
+        ValueError: If the self-defined reader is not valid.
+    Example usage:
+        >>> nodes = _self_defined_reader(custom_reader, ['arg1'], {'key': 'value'}, [], {}, custom_parser)
+    """
     try:
         loader = reader(*reader_args, **reader_kwargs)
         nodes = loader.load(*load_args, **load_kwargs)
@@ -137,10 +238,10 @@ def _self_defined_reader(
             f"Self defined reader {reader} is not valid. Error: {e}"
         ) from e
-    if isinstance(to_datanode, bool) and to_datanode is True:
+    if isinstance(to_lion, bool) and to_lion is True:
         raise ValueError("Please define a valid parser to Node.")
-    elif isinstance(to_datanode, Callable):
-        nodes = _datanode_parser(nodes, to_datanode)
+    elif isinstance(to_lion, Callable):
+        nodes = _datanode_parser(nodes, to_lion)
     return nodes

lionagi 0.1.1__py3-none-any.whl → 0.2.0__py3-none-any.whl

lionagi 0.1.1__py3-none-any.whl → 0.2.0__py3-none-any.whl