lionagi 0.1.2__py3-none-any.whl → 0.2.0__py3-none-any.whl

Sign up to get free protection for your applications and to get access to all the features.
Files changed (268) hide show
  1. lionagi/__init__.py +60 -5
  2. lionagi/core/__init__.py +0 -25
  3. lionagi/core/_setting/_setting.py +59 -0
  4. lionagi/core/action/__init__.py +14 -0
  5. lionagi/core/action/function_calling.py +136 -0
  6. lionagi/core/action/manual.py +1 -0
  7. lionagi/core/action/node.py +109 -0
  8. lionagi/core/action/tool.py +114 -0
  9. lionagi/core/action/tool_manager.py +356 -0
  10. lionagi/core/agent/base_agent.py +27 -13
  11. lionagi/core/agent/eval/evaluator.py +1 -0
  12. lionagi/core/agent/eval/vote.py +40 -0
  13. lionagi/core/agent/learn/learner.py +59 -0
  14. lionagi/core/agent/plan/unit_template.py +1 -0
  15. lionagi/core/collections/__init__.py +17 -0
  16. lionagi/core/{generic/data_logger.py → collections/_logger.py} +69 -55
  17. lionagi/core/collections/abc/__init__.py +53 -0
  18. lionagi/core/collections/abc/component.py +615 -0
  19. lionagi/core/collections/abc/concepts.py +297 -0
  20. lionagi/core/collections/abc/exceptions.py +150 -0
  21. lionagi/core/collections/abc/util.py +45 -0
  22. lionagi/core/collections/exchange.py +161 -0
  23. lionagi/core/collections/flow.py +426 -0
  24. lionagi/core/collections/model.py +419 -0
  25. lionagi/core/collections/pile.py +913 -0
  26. lionagi/core/collections/progression.py +236 -0
  27. lionagi/core/collections/util.py +64 -0
  28. lionagi/core/director/direct.py +314 -0
  29. lionagi/core/director/director.py +2 -0
  30. lionagi/core/{execute/branch_executor.py → engine/branch_engine.py} +134 -97
  31. lionagi/core/{execute/instruction_map_executor.py → engine/instruction_map_engine.py} +80 -55
  32. lionagi/{experimental/directive/evaluator → core/engine}/script_engine.py +17 -1
  33. lionagi/core/executor/base_executor.py +90 -0
  34. lionagi/core/{execute/structure_executor.py → executor/graph_executor.py} +62 -66
  35. lionagi/core/{execute → executor}/neo4j_executor.py +70 -67
  36. lionagi/core/generic/__init__.py +3 -33
  37. lionagi/core/generic/edge.py +29 -79
  38. lionagi/core/generic/edge_condition.py +16 -0
  39. lionagi/core/generic/graph.py +236 -0
  40. lionagi/core/generic/hyperedge.py +1 -0
  41. lionagi/core/generic/node.py +156 -221
  42. lionagi/core/generic/tree.py +48 -0
  43. lionagi/core/generic/tree_node.py +79 -0
  44. lionagi/core/mail/__init__.py +12 -0
  45. lionagi/core/mail/mail.py +25 -0
  46. lionagi/core/mail/mail_manager.py +139 -58
  47. lionagi/core/mail/package.py +45 -0
  48. lionagi/core/mail/start_mail.py +36 -0
  49. lionagi/core/message/__init__.py +19 -0
  50. lionagi/core/message/action_request.py +133 -0
  51. lionagi/core/message/action_response.py +135 -0
  52. lionagi/core/message/assistant_response.py +95 -0
  53. lionagi/core/message/instruction.py +234 -0
  54. lionagi/core/message/message.py +101 -0
  55. lionagi/core/message/system.py +86 -0
  56. lionagi/core/message/util.py +283 -0
  57. lionagi/core/report/__init__.py +4 -0
  58. lionagi/core/report/base.py +217 -0
  59. lionagi/core/report/form.py +231 -0
  60. lionagi/core/report/report.py +166 -0
  61. lionagi/core/report/util.py +28 -0
  62. lionagi/core/rule/_default.py +16 -0
  63. lionagi/core/rule/action.py +99 -0
  64. lionagi/core/rule/base.py +238 -0
  65. lionagi/core/rule/boolean.py +56 -0
  66. lionagi/core/rule/choice.py +47 -0
  67. lionagi/core/rule/mapping.py +96 -0
  68. lionagi/core/rule/number.py +71 -0
  69. lionagi/core/rule/rulebook.py +109 -0
  70. lionagi/core/rule/string.py +52 -0
  71. lionagi/core/rule/util.py +35 -0
  72. lionagi/core/session/branch.py +431 -0
  73. lionagi/core/session/directive_mixin.py +287 -0
  74. lionagi/core/session/session.py +229 -903
  75. lionagi/core/structure/__init__.py +1 -0
  76. lionagi/core/structure/chain.py +1 -0
  77. lionagi/core/structure/forest.py +1 -0
  78. lionagi/core/structure/graph.py +1 -0
  79. lionagi/core/structure/tree.py +1 -0
  80. lionagi/core/unit/__init__.py +5 -0
  81. lionagi/core/unit/parallel_unit.py +245 -0
  82. lionagi/core/unit/template/action.py +81 -0
  83. lionagi/core/unit/template/base.py +51 -0
  84. lionagi/core/unit/template/plan.py +84 -0
  85. lionagi/core/unit/template/predict.py +109 -0
  86. lionagi/core/unit/template/score.py +124 -0
  87. lionagi/core/unit/template/select.py +104 -0
  88. lionagi/core/unit/unit.py +362 -0
  89. lionagi/core/unit/unit_form.py +305 -0
  90. lionagi/core/unit/unit_mixin.py +1168 -0
  91. lionagi/core/unit/util.py +71 -0
  92. lionagi/core/validator/validator.py +364 -0
  93. lionagi/core/work/work.py +74 -0
  94. lionagi/core/work/work_function.py +92 -0
  95. lionagi/core/work/work_queue.py +81 -0
  96. lionagi/core/work/worker.py +195 -0
  97. lionagi/core/work/worklog.py +124 -0
  98. lionagi/experimental/compressor/base.py +46 -0
  99. lionagi/experimental/compressor/llm_compressor.py +247 -0
  100. lionagi/experimental/compressor/llm_summarizer.py +61 -0
  101. lionagi/experimental/compressor/util.py +70 -0
  102. lionagi/experimental/directive/__init__.py +19 -0
  103. lionagi/experimental/directive/parser/base_parser.py +69 -2
  104. lionagi/experimental/directive/{template_ → template}/base_template.py +17 -1
  105. lionagi/{libs/ln_tokenizer.py → experimental/directive/tokenizer.py} +16 -0
  106. lionagi/experimental/{directive/evaluator → evaluator}/ast_evaluator.py +16 -0
  107. lionagi/experimental/{directive/evaluator → evaluator}/base_evaluator.py +16 -0
  108. lionagi/experimental/knowledge/base.py +10 -0
  109. lionagi/experimental/memory/__init__.py +0 -0
  110. lionagi/experimental/strategies/__init__.py +0 -0
  111. lionagi/experimental/strategies/base.py +1 -0
  112. lionagi/integrations/bridge/langchain_/documents.py +4 -0
  113. lionagi/integrations/bridge/llamaindex_/index.py +30 -0
  114. lionagi/integrations/bridge/llamaindex_/llama_index_bridge.py +6 -0
  115. lionagi/integrations/chunker/chunk.py +161 -24
  116. lionagi/integrations/config/oai_configs.py +34 -3
  117. lionagi/integrations/config/openrouter_configs.py +14 -2
  118. lionagi/integrations/loader/load.py +122 -21
  119. lionagi/integrations/loader/load_util.py +6 -77
  120. lionagi/integrations/provider/_mapping.py +46 -0
  121. lionagi/integrations/provider/litellm.py +2 -1
  122. lionagi/integrations/provider/mlx_service.py +16 -9
  123. lionagi/integrations/provider/oai.py +91 -4
  124. lionagi/integrations/provider/ollama.py +6 -5
  125. lionagi/integrations/provider/openrouter.py +115 -8
  126. lionagi/integrations/provider/services.py +2 -2
  127. lionagi/integrations/provider/transformers.py +18 -22
  128. lionagi/integrations/storage/__init__.py +3 -3
  129. lionagi/integrations/storage/neo4j.py +52 -60
  130. lionagi/integrations/storage/storage_util.py +44 -46
  131. lionagi/integrations/storage/structure_excel.py +43 -26
  132. lionagi/integrations/storage/to_excel.py +11 -4
  133. lionagi/libs/__init__.py +22 -1
  134. lionagi/libs/ln_api.py +75 -20
  135. lionagi/libs/ln_context.py +37 -0
  136. lionagi/libs/ln_convert.py +21 -9
  137. lionagi/libs/ln_func_call.py +69 -28
  138. lionagi/libs/ln_image.py +107 -0
  139. lionagi/libs/ln_nested.py +26 -11
  140. lionagi/libs/ln_parse.py +82 -23
  141. lionagi/libs/ln_queue.py +16 -0
  142. lionagi/libs/ln_tokenize.py +164 -0
  143. lionagi/libs/ln_validate.py +16 -0
  144. lionagi/libs/special_tokens.py +172 -0
  145. lionagi/libs/sys_util.py +95 -24
  146. lionagi/lions/coder/code_form.py +13 -0
  147. lionagi/lions/coder/coder.py +50 -3
  148. lionagi/lions/coder/util.py +30 -25
  149. lionagi/tests/libs/test_func_call.py +23 -21
  150. lionagi/tests/libs/test_nested.py +36 -21
  151. lionagi/tests/libs/test_parse.py +1 -1
  152. lionagi/tests/test_core/collections/__init__.py +0 -0
  153. lionagi/tests/test_core/collections/test_component.py +206 -0
  154. lionagi/tests/test_core/collections/test_exchange.py +138 -0
  155. lionagi/tests/test_core/collections/test_flow.py +145 -0
  156. lionagi/tests/test_core/collections/test_pile.py +171 -0
  157. lionagi/tests/test_core/collections/test_progression.py +129 -0
  158. lionagi/tests/test_core/generic/test_edge.py +67 -0
  159. lionagi/tests/test_core/generic/test_graph.py +96 -0
  160. lionagi/tests/test_core/generic/test_node.py +106 -0
  161. lionagi/tests/test_core/generic/test_tree_node.py +73 -0
  162. lionagi/tests/test_core/test_branch.py +115 -294
  163. lionagi/tests/test_core/test_form.py +46 -0
  164. lionagi/tests/test_core/test_report.py +105 -0
  165. lionagi/tests/test_core/test_validator.py +111 -0
  166. lionagi/version.py +1 -1
  167. lionagi-0.2.0.dist-info/LICENSE +202 -0
  168. lionagi-0.2.0.dist-info/METADATA +272 -0
  169. lionagi-0.2.0.dist-info/RECORD +240 -0
  170. lionagi/core/branch/base.py +0 -653
  171. lionagi/core/branch/branch.py +0 -474
  172. lionagi/core/branch/flow_mixin.py +0 -96
  173. lionagi/core/branch/util.py +0 -323
  174. lionagi/core/direct/__init__.py +0 -19
  175. lionagi/core/direct/cot.py +0 -123
  176. lionagi/core/direct/plan.py +0 -164
  177. lionagi/core/direct/predict.py +0 -166
  178. lionagi/core/direct/react.py +0 -171
  179. lionagi/core/direct/score.py +0 -279
  180. lionagi/core/direct/select.py +0 -170
  181. lionagi/core/direct/sentiment.py +0 -1
  182. lionagi/core/direct/utils.py +0 -110
  183. lionagi/core/direct/vote.py +0 -64
  184. lionagi/core/execute/base_executor.py +0 -47
  185. lionagi/core/flow/baseflow.py +0 -23
  186. lionagi/core/flow/monoflow/ReAct.py +0 -240
  187. lionagi/core/flow/monoflow/__init__.py +0 -9
  188. lionagi/core/flow/monoflow/chat.py +0 -95
  189. lionagi/core/flow/monoflow/chat_mixin.py +0 -253
  190. lionagi/core/flow/monoflow/followup.py +0 -215
  191. lionagi/core/flow/polyflow/__init__.py +0 -1
  192. lionagi/core/flow/polyflow/chat.py +0 -251
  193. lionagi/core/form/action_form.py +0 -26
  194. lionagi/core/form/field_validator.py +0 -287
  195. lionagi/core/form/form.py +0 -302
  196. lionagi/core/form/mixin.py +0 -214
  197. lionagi/core/form/scored_form.py +0 -13
  198. lionagi/core/generic/action.py +0 -26
  199. lionagi/core/generic/component.py +0 -532
  200. lionagi/core/generic/condition.py +0 -46
  201. lionagi/core/generic/mail.py +0 -90
  202. lionagi/core/generic/mailbox.py +0 -36
  203. lionagi/core/generic/relation.py +0 -70
  204. lionagi/core/generic/signal.py +0 -22
  205. lionagi/core/generic/structure.py +0 -362
  206. lionagi/core/generic/transfer.py +0 -20
  207. lionagi/core/generic/work.py +0 -40
  208. lionagi/core/graph/graph.py +0 -126
  209. lionagi/core/graph/tree.py +0 -190
  210. lionagi/core/mail/schema.py +0 -63
  211. lionagi/core/messages/schema.py +0 -325
  212. lionagi/core/tool/__init__.py +0 -5
  213. lionagi/core/tool/tool.py +0 -28
  214. lionagi/core/tool/tool_manager.py +0 -283
  215. lionagi/experimental/report/form.py +0 -64
  216. lionagi/experimental/report/report.py +0 -138
  217. lionagi/experimental/report/util.py +0 -47
  218. lionagi/experimental/tool/function_calling.py +0 -43
  219. lionagi/experimental/tool/manual.py +0 -66
  220. lionagi/experimental/tool/schema.py +0 -59
  221. lionagi/experimental/tool/tool_manager.py +0 -138
  222. lionagi/experimental/tool/util.py +0 -16
  223. lionagi/experimental/validator/rule.py +0 -139
  224. lionagi/experimental/validator/validator.py +0 -56
  225. lionagi/experimental/work/__init__.py +0 -10
  226. lionagi/experimental/work/async_queue.py +0 -54
  227. lionagi/experimental/work/schema.py +0 -73
  228. lionagi/experimental/work/work_function.py +0 -67
  229. lionagi/experimental/work/worker.py +0 -56
  230. lionagi/experimental/work2/form.py +0 -371
  231. lionagi/experimental/work2/report.py +0 -289
  232. lionagi/experimental/work2/schema.py +0 -30
  233. lionagi/experimental/work2/tests.py +0 -72
  234. lionagi/experimental/work2/work_function.py +0 -89
  235. lionagi/experimental/work2/worker.py +0 -12
  236. lionagi/integrations/bridge/llamaindex_/get_index.py +0 -294
  237. lionagi/tests/test_core/generic/test_component.py +0 -89
  238. lionagi/tests/test_core/test_base_branch.py +0 -426
  239. lionagi/tests/test_core/test_chat_flow.py +0 -63
  240. lionagi/tests/test_core/test_mail_manager.py +0 -75
  241. lionagi/tests/test_core/test_prompts.py +0 -51
  242. lionagi/tests/test_core/test_session.py +0 -254
  243. lionagi/tests/test_core/test_session_base_util.py +0 -313
  244. lionagi/tests/test_core/test_tool_manager.py +0 -95
  245. lionagi-0.1.2.dist-info/LICENSE +0 -9
  246. lionagi-0.1.2.dist-info/METADATA +0 -174
  247. lionagi-0.1.2.dist-info/RECORD +0 -206
  248. /lionagi/core/{branch → _setting}/__init__.py +0 -0
  249. /lionagi/core/{execute → agent/eval}/__init__.py +0 -0
  250. /lionagi/core/{flow → agent/learn}/__init__.py +0 -0
  251. /lionagi/core/{form → agent/plan}/__init__.py +0 -0
  252. /lionagi/core/{branch/executable_branch.py → agent/plan/plan.py} +0 -0
  253. /lionagi/core/{graph → director}/__init__.py +0 -0
  254. /lionagi/core/{messages → engine}/__init__.py +0 -0
  255. /lionagi/{experimental/directive/evaluator → core/engine}/sandbox_.py +0 -0
  256. /lionagi/{experimental/directive/evaluator → core/executor}/__init__.py +0 -0
  257. /lionagi/{experimental/directive/template_ → core/rule}/__init__.py +0 -0
  258. /lionagi/{experimental/report → core/unit/template}/__init__.py +0 -0
  259. /lionagi/{experimental/tool → core/validator}/__init__.py +0 -0
  260. /lionagi/{experimental/validator → core/work}/__init__.py +0 -0
  261. /lionagi/experimental/{work2 → compressor}/__init__.py +0 -0
  262. /lionagi/{core/flow/mono_chat_mixin.py → experimental/directive/template/__init__.py} +0 -0
  263. /lionagi/experimental/directive/{schema.py → template/schema.py} +0 -0
  264. /lionagi/experimental/{work2/util.py → evaluator/__init__.py} +0 -0
  265. /lionagi/experimental/{work2/work.py → knowledge/__init__.py} +0 -0
  266. /lionagi/{tests/libs/test_async.py → experimental/knowledge/graph.py} +0 -0
  267. {lionagi-0.1.2.dist-info → lionagi-0.2.0.dist-info}/WHEEL +0 -0
  268. {lionagi-0.1.2.dist-info → lionagi-0.2.0.dist-info}/top_level.txt +0 -0
@@ -1,8 +1,10 @@
1
1
  # Default configs for the OpenAI API
2
2
 
3
+ API_key_schema = ("OPENAI_API_KEY",)
4
+
3
5
  # ChatCompletion
4
6
  oai_chat_llmconfig = {
5
- "model": "gpt-4-turbo",
7
+ "model": "gpt-4o",
6
8
  "frequency_penalty": 0,
7
9
  "max_tokens": None,
8
10
  "n": 1,
@@ -11,11 +13,13 @@ oai_chat_llmconfig = {
11
13
  "seed": None,
12
14
  "stop": None,
13
15
  "stream": False,
14
- "temperature": 0.7,
16
+ "temperature": 0.1,
15
17
  "top_p": 1,
16
18
  "tools": None,
17
19
  "tool_choice": "none",
18
20
  "user": None,
21
+ "logprobs": False,
22
+ "top_logprobs": None,
19
23
  }
20
24
 
21
25
  oai_chat_schema = {
@@ -36,9 +40,16 @@ oai_chat_schema = {
36
40
  "tool_choice",
37
41
  "user",
38
42
  "max_tokens",
43
+ "logprobs",
44
+ "top_logprobs",
39
45
  ],
40
46
  "input_": "messages",
41
47
  "config": oai_chat_llmconfig,
48
+ "token_encoding_name": "cl100k_base",
49
+ "token_limit": 128_000,
50
+ "interval_tokens": 1_000_000,
51
+ "interval_requests": 1_000,
52
+ "interval": 60,
42
53
  }
43
54
 
44
55
  # Finetune
@@ -111,8 +122,26 @@ oai_audio_translations_schema = {
111
122
  "config": oai_audio_translations_llmconfig,
112
123
  }
113
124
 
114
- # images
125
+ # embeddings
115
126
 
127
+ oai_embeddings_llmconfig = {
128
+ "model": "text-embedding-ada-002",
129
+ "encoding_format": "float",
130
+ "user": None,
131
+ "dimensions": None,
132
+ }
133
+
134
+ oai_embeddings_schema = {
135
+ "required": ["model", "encoding_format"],
136
+ "optional": ["user", "dimensions"],
137
+ "input_": "input",
138
+ "config": oai_embeddings_llmconfig,
139
+ "token_encoding_name": "cl100k_base",
140
+ "token_limit": 8192,
141
+ "interval_tokens": 1_000_000,
142
+ "interval_requests": 1_000,
143
+ "interval": 60,
144
+ }
116
145
 
117
146
  oai_schema = {
118
147
  "chat/completions": oai_chat_schema,
@@ -120,4 +149,6 @@ oai_schema = {
120
149
  "audio_speech": oai_audio_speech_schema,
121
150
  "audio_transcriptions": oai_audio_transcriptions_schema,
122
151
  "audio_translations": oai_audio_translations_schema,
152
+ "API_key_schema": API_key_schema,
153
+ "embeddings": oai_embeddings_schema,
123
154
  }
@@ -1,5 +1,7 @@
1
+ API_key_schema = ("OPENROUTER_API_KEY",)
2
+
1
3
  openrouter_chat_llmconfig = {
2
- "model": "gpt-4-turbo",
4
+ "model": "gpt-4o",
3
5
  "frequency_penalty": 0,
4
6
  "max_tokens": None,
5
7
  "num": 1,
@@ -8,11 +10,13 @@ openrouter_chat_llmconfig = {
8
10
  "seed": None,
9
11
  "stop": None,
10
12
  "stream": False,
11
- "temperature": 0.7,
13
+ "temperature": 0.1,
12
14
  "top_p": 1,
13
15
  "tools": None,
14
16
  "tool_choice": "none",
15
17
  "user": None,
18
+ "logprobs": False,
19
+ "top_logprobs": None,
16
20
  }
17
21
 
18
22
  openrouter_chat_schema = {
@@ -33,9 +37,16 @@ openrouter_chat_schema = {
33
37
  "tool_choice",
34
38
  "user",
35
39
  "max_tokens",
40
+ "logprobs",
41
+ "top_logprobs",
36
42
  ],
37
43
  "input_": "messages",
38
44
  "config": openrouter_chat_llmconfig,
45
+ "token_encoding_name": "cl100k_base",
46
+ "token_limit": 128_000,
47
+ "interval_tokens": 10_000,
48
+ "interval_requests": 100,
49
+ "interval": 60,
39
50
  }
40
51
 
41
52
  openrouter_finetune_llmconfig = {
@@ -59,4 +70,5 @@ openrouter_finetune_schema = {
59
70
  openrouter_schema = {
60
71
  "chat/completions": openrouter_chat_schema,
61
72
  "finetune": openrouter_finetune_schema,
73
+ "API_key_schema": API_key_schema,
62
74
  }
@@ -1,6 +1,7 @@
1
1
  from typing import Callable
2
2
 
3
3
  from lionagi.core.generic import Node
4
+ from lionagi.core.collections import pile
4
5
  from ..bridge.langchain_.langchain_bridge import LangchainBridge
5
6
  from ..bridge.llamaindex_.llama_index_bridge import LlamaIndexBridge
6
7
 
@@ -27,18 +28,43 @@ def text_reader(args, kwargs):
27
28
 
28
29
 
29
30
  def load(
30
- reader: str | Callable = "SimpleDirectoryReader",
31
+ reader: str | Callable = "text_reader",
31
32
  input_dir=None,
32
33
  input_files=None,
33
34
  recursive: bool = False,
34
35
  required_exts: list[str] = None,
35
- reader_type=ReaderType.LLAMAINDEX,
36
+ reader_type=ReaderType.PLAIN,
36
37
  reader_args=None,
37
38
  reader_kwargs=None,
38
39
  load_args=None,
39
40
  load_kwargs=None,
40
- to_datanode: bool | Callable = True,
41
+ to_lion: bool | Callable = True,
41
42
  ):
43
+ """
44
+ Loads data using the specified reader and converts it to Node instances.
45
+
46
+ Args:
47
+ reader (str | Callable): The reader function or its name. Defaults to "text_reader".
48
+ input_dir (str, optional): The directory to read files from. Defaults to None.
49
+ input_files (list[str], optional): Specific files to read. Defaults to None.
50
+ recursive (bool, optional): Whether to read files recursively. Defaults to False.
51
+ required_exts (list[str], optional): List of required file extensions. Defaults to None.
52
+ reader_type (ReaderType, optional): The type of reader to use. Defaults to ReaderType.PLAIN.
53
+ reader_args (list, optional): Positional arguments for the reader function. Defaults to None.
54
+ reader_kwargs (dict, optional): Keyword arguments for the reader function. Defaults to None.
55
+ load_args (list, optional): Positional arguments for loading. Defaults to None.
56
+ load_kwargs (dict, optional): Keyword arguments for loading. Defaults to None.
57
+ to_lion (bool | Callable, optional): Whether to convert the data to Node instances or a custom parser. Defaults to True.
58
+
59
+ Returns:
60
+ pile: A pile of Node instances.
61
+
62
+ Raises:
63
+ ValueError: If the reader_type is not supported.
64
+
65
+ Example usage:
66
+ >>> nodes = load(input_dir='path/to/text/files', required_exts=['txt'])
67
+ """
42
68
 
43
69
  if reader_args is None:
44
70
  reader_args = []
@@ -50,11 +76,15 @@ def load(
50
76
  load_kwargs = {}
51
77
 
52
78
  if reader_type == ReaderType.PLAIN:
79
+ reader_kwargs["dir_"] = input_dir
80
+ reader_kwargs["ext"] = required_exts
81
+ reader_kwargs["recursive"] = recursive
82
+
53
83
  return read_funcs[ReaderType.PLAIN](reader, reader_args, reader_kwargs)
54
84
 
55
85
  if reader_type == ReaderType.LANGCHAIN:
56
86
  return read_funcs[ReaderType.LANGCHAIN](
57
- reader, reader_args, reader_kwargs, to_datanode
87
+ reader, reader_args, reader_kwargs, to_lion
58
88
  )
59
89
 
60
90
  elif reader_type == ReaderType.LLAMAINDEX:
@@ -68,12 +98,12 @@ def load(
68
98
  reader_kwargs["required_exts"] = required_exts
69
99
 
70
100
  return read_funcs[ReaderType.LLAMAINDEX](
71
- reader, reader_args, reader_kwargs, load_args, load_kwargs, to_datanode
101
+ reader, reader_args, reader_kwargs, load_args, load_kwargs, to_lion
72
102
  )
73
103
 
74
104
  elif reader_type == ReaderType.SELFDEFINED:
75
105
  return read_funcs[ReaderType.SELFDEFINED](
76
- reader, reader_args, reader_kwargs, load_args, load_kwargs, to_datanode
106
+ reader, reader_args, reader_kwargs, load_args, load_kwargs, to_lion
77
107
  )
78
108
 
79
109
  else:
@@ -83,23 +113,56 @@ def load(
83
113
 
84
114
 
85
115
  def _plain_reader(reader, reader_args, reader_kwargs):
116
+ """
117
+ Reads data using a plain reader.
118
+
119
+ Args:
120
+ reader (str | Callable): The reader function or its name.
121
+ reader_args (list): Positional arguments for the reader function.
122
+ reader_kwargs (dict): Keyword arguments for the reader function.
123
+
124
+ Returns:
125
+ pile: A pile of Node instances.
126
+
127
+ Raises:
128
+ ValueError: If the reader is not supported.
129
+
130
+ Example usage:
131
+ >>> nodes = _plain_reader('text_reader', ['path/to/files'], {'ext': 'txt'})
132
+ """
86
133
  try:
87
134
  if reader == "text_reader":
88
135
  reader = text_reader
89
- return reader(reader_args, reader_kwargs)
136
+ nodes = reader(reader_args, reader_kwargs)
137
+ return pile(nodes)
90
138
  except Exception as e:
91
139
  raise ValueError(
92
140
  f"Reader {reader} is currently not supported. Error: {e}"
93
141
  ) from e
94
142
 
95
143
 
96
- def _langchain_reader(reader, reader_args, reader_kwargs, to_datanode: bool | Callable):
144
+ def _langchain_reader(reader, reader_args, reader_kwargs, to_lion: bool | Callable):
145
+ """
146
+ Reads data using a Langchain reader.
147
+
148
+ Args:
149
+ reader (str | Callable): The reader function or its name.
150
+ reader_args (list): Positional arguments for the reader function.
151
+ reader_kwargs (dict): Keyword arguments for the reader function.
152
+ to_lion (bool | Callable): Whether to convert the data to Node instances or a custom parser.
153
+
154
+ Returns:
155
+ pile: A pile of Node instances or custom parsed nodes.
156
+
157
+ Example usage:
158
+ >>> nodes = _langchain_reader('langchain_reader', ['arg1'], {'key': 'value'}, True)
159
+ """
97
160
  nodes = LangchainBridge.langchain_loader(reader, reader_args, reader_kwargs)
98
- if isinstance(to_datanode, bool) and to_datanode is True:
99
- nodes = [Node.from_langchain(i) for i in nodes]
161
+ if isinstance(to_lion, bool) and to_lion is True:
162
+ return pile([Node.from_langchain(i) for i in nodes])
100
163
 
101
- elif isinstance(to_datanode, Callable):
102
- nodes = _datanode_parser(nodes, to_datanode)
164
+ elif isinstance(to_lion, Callable):
165
+ nodes = _datanode_parser(nodes, to_lion)
103
166
  return nodes
104
167
 
105
168
 
@@ -109,15 +172,33 @@ def _llama_index_reader(
109
172
  reader_kwargs,
110
173
  load_args,
111
174
  load_kwargs,
112
- to_datanode: bool | Callable,
175
+ to_lion: bool | Callable,
113
176
  ):
177
+ """
178
+ Reads data using a LlamaIndex reader.
179
+
180
+ Args:
181
+ reader (str | Callable): The reader function or its name.
182
+ reader_args (list): Positional arguments for the reader function.
183
+ reader_kwargs (dict): Keyword arguments for the reader function.
184
+ load_args (list): Positional arguments for loading.
185
+ load_kwargs (dict): Keyword arguments for loading.
186
+ to_lion (bool | Callable): Whether to convert the data to Node instances or a custom parser.
187
+
188
+ Returns:
189
+ pile: A pile of Node instances or custom parsed nodes.
190
+
191
+ Example usage:
192
+ >>> nodes = _llama_index_reader('llama_reader', ['arg1'], {'key': 'value'}, [], {}, True)
193
+ """
114
194
  nodes = LlamaIndexBridge.llama_index_read_data(
115
195
  reader, reader_args, reader_kwargs, load_args, load_kwargs
116
196
  )
117
- if isinstance(to_datanode, bool) and to_datanode is True:
118
- nodes = [Node.from_llama_index(i) for i in nodes]
119
- elif isinstance(to_datanode, Callable):
120
- nodes = _datanode_parser(nodes, to_datanode)
197
+ if isinstance(to_lion, bool) and to_lion is True:
198
+ return pile([Node.from_llama_index(i) for i in nodes])
199
+
200
+ elif isinstance(to_lion, Callable):
201
+ nodes = _datanode_parser(nodes, to_lion)
121
202
  return nodes
122
203
 
123
204
 
@@ -127,8 +208,28 @@ def _self_defined_reader(
127
208
  reader_kwargs,
128
209
  load_args,
129
210
  load_kwargs,
130
- to_datanode: bool | Callable,
211
+ to_lion: bool | Callable,
131
212
  ):
213
+ """
214
+ Reads data using a self-defined reader.
215
+
216
+ Args:
217
+ reader (str | Callable): The reader function or its name.
218
+ reader_args (list): Positional arguments for the reader function.
219
+ reader_kwargs (dict): Keyword arguments for the reader function.
220
+ load_args (list): Positional arguments for loading.
221
+ load_kwargs (dict): Keyword arguments for loading.
222
+ to_lion (bool | Callable): Whether to convert the data to Node instances or a custom parser.
223
+
224
+ Returns:
225
+ pile: A pile of Node instances or custom parsed nodes.
226
+
227
+ Raises:
228
+ ValueError: If the self-defined reader is not valid.
229
+
230
+ Example usage:
231
+ >>> nodes = _self_defined_reader(custom_reader, ['arg1'], {'key': 'value'}, [], {}, custom_parser)
232
+ """
132
233
  try:
133
234
  loader = reader(*reader_args, **reader_kwargs)
134
235
  nodes = loader.load(*load_args, **load_kwargs)
@@ -137,10 +238,10 @@ def _self_defined_reader(
137
238
  f"Self defined reader {reader} is not valid. Error: {e}"
138
239
  ) from e
139
240
 
140
- if isinstance(to_datanode, bool) and to_datanode is True:
241
+ if isinstance(to_lion, bool) and to_lion is True:
141
242
  raise ValueError("Please define a valid parser to Node.")
142
- elif isinstance(to_datanode, Callable):
143
- nodes = _datanode_parser(nodes, to_datanode)
243
+ elif isinstance(to_lion, Callable):
244
+ nodes = _datanode_parser(nodes, to_lion)
144
245
  return nodes
145
246
 
146
247
 
@@ -1,10 +1,10 @@
1
1
  # use utils and schema
2
- import math
3
2
  from enum import Enum
4
3
  from pathlib import Path
5
4
  from typing import List, Union, Dict, Any, Tuple
6
5
 
7
6
  from lionagi.libs import convert, func_call
7
+ from lionagi.libs.ln_tokenize import TokenizeUtil
8
8
  from lionagi.core.generic import Node
9
9
 
10
10
 
@@ -57,7 +57,7 @@ def dir_to_path(
57
57
 
58
58
 
59
59
  def dir_to_nodes(
60
- dir: str,
60
+ dir_: str,
61
61
  ext: Union[List[str], str],
62
62
  recursive: bool = False,
63
63
  flatten: bool = True,
@@ -84,82 +84,11 @@ def dir_to_nodes(
84
84
  # converting them into Node objects.
85
85
  """
86
86
 
87
- path_list = dir_to_path(dir, ext, recursive, flatten)
87
+ path_list = dir_to_path(dir=dir_, ext=ext, recursive=recursive, flatten=flatten)
88
88
  files_info = func_call.lcall(path_list, read_text, clean=clean_text)
89
89
  return func_call.lcall(files_info, lambda x: Node(content=x[0], metadata=x[1]))
90
90
 
91
91
 
92
- def chunk_text(
93
- input: str, chunk_size: int, overlap: float, threshold: int
94
- ) -> List[Union[str, None]]:
95
- """
96
- Chunks the input text into smaller parts, with optional overlap and threshold for final chunk.
97
-
98
- Parameters:
99
- input (str): The input text to chunk.
100
-
101
- chunk_size (int): The size of each chunk.
102
-
103
- overlap (float): The amount of overlap between chunks.
104
-
105
- threshold (int): The minimum size of the final chunk.
106
-
107
- Returns:
108
- List[Union[str, None]]: A list of text chunks.
109
-
110
- Raises:
111
- ValueError: If an error occurs during chunking.
112
- """
113
-
114
- def _chunk_n1():
115
- return [input]
116
-
117
- def _chunk_n2():
118
- chunks = []
119
- chunks.append(input[: chunk_size + overlap_size])
120
-
121
- if len(input) - chunk_size > threshold:
122
- chunks.append(input[chunk_size - overlap_size :])
123
- else:
124
- return _chunk_n1()
125
-
126
- return chunks
127
-
128
- def _chunk_n3():
129
- chunks = []
130
- chunks.append(input[: chunk_size + overlap_size])
131
- for i in range(1, n_chunks - 1):
132
- start_idx = chunk_size * i - overlap_size
133
- end_idx = chunk_size * (i + 1) + overlap_size
134
- chunks.append(input[start_idx:end_idx])
135
-
136
- if len(input) - chunk_size * (n_chunks - 1) > threshold:
137
- chunks.append(input[chunk_size * (n_chunks - 1) - overlap_size :])
138
- else:
139
- chunks[-1] += input[chunk_size * (n_chunks - 1) + overlap_size :]
140
-
141
- return chunks
142
-
143
- try:
144
- if not isinstance(input, str):
145
- input = convert.to_str(input)
146
-
147
- n_chunks = math.ceil(len(input) / chunk_size)
148
- overlap_size = int(overlap / 2)
149
-
150
- if n_chunks == 1:
151
- return _chunk_n1()
152
-
153
- elif n_chunks == 2:
154
- return _chunk_n2()
155
-
156
- elif n_chunks > 2:
157
- return _chunk_n3()
158
-
159
- except Exception as e:
160
- raise ValueError(f"An error occurred while chunking the text. {e}")
161
-
162
-
163
92
  def read_text(filepath: str, clean: bool = True) -> Tuple[str, dict]:
164
93
  """
165
94
  Reads text from a file and optionally cleans it, returning the content and metadata.
@@ -202,9 +131,9 @@ def read_text(filepath: str, clean: bool = True) -> Tuple[str, dict]:
202
131
  content = f.read()
203
132
  if clean:
204
133
  # Define characters to replace and their replacements
205
- replacements = {"\\": " ", "\n": " ", "\t": " ", " ": " ", "'": " "}
134
+ replacements = {"\\": "", "\n\n": "\n"}
206
135
  for old, new in replacements.items():
207
- content = content.replace(old, new)
136
+ content = content.replace(old, new).strip()
208
137
  metadata = _get_metadata()
209
138
  return content, metadata
210
139
  except Exception as e:
@@ -223,7 +152,7 @@ def _file_to_chunks(
223
152
  "chunk_overlap": overlap,
224
153
  "chunk_threshold": threshold,
225
154
  }
226
- chunks = chunk_text(
155
+ chunks = TokenizeUtil.chunk_by_chars(
227
156
  input[field], chunk_size=chunk_size, overlap=overlap, threshold=threshold
228
157
  )
229
158
  logs = []
@@ -0,0 +1,46 @@
1
+ from .oai import OpenAIService
2
+ from .openrouter import OpenRouterService
3
+ from .ollama import OllamaService
4
+ from .transformers import TransformersService
5
+ from .litellm import LiteLLMService
6
+ from .mlx_service import MLXService
7
+ from lionagi.integrations.config.oai_configs import oai_schema
8
+ from lionagi.integrations.config.openrouter_configs import openrouter_schema
9
+
10
+ SERVICE_PROVIDERS_MAPPING = {
11
+ "openai": {
12
+ "service": OpenAIService,
13
+ "schema": oai_schema,
14
+ "default_model": "gpt-3.5-turbo",
15
+ },
16
+ "openrouter": {
17
+ "service": OpenRouterService,
18
+ "schema": openrouter_schema,
19
+ "default_model": "gpt-3.5-turbo",
20
+ },
21
+ "litellm": {
22
+ "service": LiteLLMService,
23
+ "schema": oai_schema,
24
+ "default_model": "gpt-3.5-turbo",
25
+ },
26
+ "ollama": {
27
+ "service": OllamaService,
28
+ "schema": {"model": "llama3"},
29
+ "default_model": "llama3",
30
+ },
31
+ "transformers": {
32
+ "service": TransformersService,
33
+ "schema": {"model": "gpt2"},
34
+ "default_model": "gpt2",
35
+ },
36
+ "mlx": {
37
+ "service": MLXService,
38
+ "schema": {"model": "mlx-community/OLMo-7B-hf-4bit-mlx"},
39
+ "default_model": "mlx-community/OLMo-7B-hf-4bit-mlx",
40
+ },
41
+ }
42
+
43
+ # TODO
44
+ # "Ollama": OllamaService,
45
+ # "Transformers": TransformersService,
46
+ # "MLX": MLXService,
@@ -31,12 +31,13 @@ class LiteLLMService(BaseService):
31
31
  self.acompletion = acompletion
32
32
  self.model = model
33
33
  self.kwargs = kwargs
34
+ self.allowed_kwargs = allowed_kwargs
34
35
 
35
36
  async def serve_chat(self, messages, **kwargs):
36
37
  payload = {"messages": messages}
37
38
  config = {}
38
39
  for k, v in kwargs.items():
39
- if k in allowed_kwargs:
40
+ if k in self.allowed_kwargs:
40
41
  config[k] = v
41
42
 
42
43
  kwargs = {**self.kwargs, **config}
@@ -1,13 +1,18 @@
1
+ import re
1
2
  from lionagi.libs.sys_util import SysUtil
2
3
  import lionagi.libs.ln_convert as convert
3
4
  from lionagi.libs.ln_api import BaseService
4
5
  from lionagi.integrations.config.mlx_configs import model
5
6
 
6
7
 
7
- class MlXService(BaseService):
8
+ class MLXService(BaseService):
8
9
  def __init__(self, model=model, **kwargs):
9
10
 
10
11
  SysUtil.check_import("mlx_lm")
12
+ SysUtil.check_import("ipywidgets")
13
+
14
+ if model is not None and "olmo" in str(model).lower():
15
+ SysUtil.check_import("olmo", pip_name="ai2-olmo")
11
16
 
12
17
  from mlx_lm import load, generate
13
18
 
@@ -19,16 +24,13 @@ class MlXService(BaseService):
19
24
  self.model = model_
20
25
  self.tokenizer = tokenizer
21
26
  self.generate = generate
27
+ self.allowed_kwargs = []
22
28
 
23
29
  async def serve_chat(self, messages, **kwargs):
24
30
  if "verbose" not in kwargs.keys():
25
- verbose = True
31
+ verbose = False
26
32
 
27
- prompts = [
28
- convert.to_dict(msg["content"])["instruction"]
29
- for msg in messages
30
- if msg["role"] == "user"
31
- ]
33
+ prompts = [msg["content"] for msg in messages if msg["role"] == "user"]
32
34
 
33
35
  payload = {"messages": messages}
34
36
 
@@ -39,8 +41,13 @@ class MlXService(BaseService):
39
41
  prompt=f"{prompts[-1]} \nOutput: ",
40
42
  verbose=verbose,
41
43
  )
42
- completion = {"model": self.model_name, "choices": [{"message": response}]}
43
-
44
+ if "```" in response:
45
+ regex = re.compile(r"```[\s\S]*?```")
46
+ matches = regex.findall(response)
47
+ msg = matches[0].strip("```")
48
+ completion = {"choices": [{"message": {"content": msg}}]}
49
+ else:
50
+ completion = {"choices": [{"message": {"content": response}}]}
44
51
  return payload, completion
45
52
  except Exception as e:
46
53
  self.status_tracker.num_tasks_failed += 1