lionagi 0.4.0__py3-none-any.whl → 0.5.0__py3-none-any.whl

Sign up to get free protection for your applications and to get access to all the features.
Files changed (584)
  1. lionagi/__init__.py +14 -46
  2. lionagi/core/__init__.py +3 -1
  3. lionagi/core/_class_registry.py +69 -0
  4. lionagi/core/action/__init__.py +3 -13
  5. lionagi/core/action/action_manager.py +287 -0
  6. lionagi/core/action/base.py +109 -0
  7. lionagi/core/action/function_calling.py +127 -92
  8. lionagi/core/action/tool.py +172 -70
  9. lionagi/core/action/types.py +16 -0
  10. lionagi/core/communication/__init__.py +3 -0
  11. lionagi/core/communication/action_request.py +163 -0
  12. lionagi/core/communication/action_response.py +149 -0
  13. lionagi/core/communication/assistant_response.py +161 -0
  14. lionagi/core/communication/base_mail.py +49 -0
  15. lionagi/core/communication/instruction.py +376 -0
  16. lionagi/core/communication/message.py +286 -0
  17. lionagi/core/communication/message_manager.py +530 -0
  18. lionagi/core/communication/system.py +116 -0
  19. lionagi/core/communication/templates/README.md +28 -0
  20. lionagi/core/communication/templates/action_request.jinja2 +5 -0
  21. lionagi/core/communication/templates/action_response.jinja2 +9 -0
  22. lionagi/core/communication/templates/assistant_response.jinja2 +2 -0
  23. lionagi/core/communication/templates/instruction_message.jinja2 +61 -0
  24. lionagi/core/communication/templates/system_message.jinja2 +11 -0
  25. lionagi/core/communication/templates/tool_schemas.jinja2 +7 -0
  26. lionagi/core/communication/types.py +27 -0
  27. lionagi/core/communication/utils.py +254 -0
  28. lionagi/core/forms/__init__.py +3 -0
  29. lionagi/core/forms/base.py +232 -0
  30. lionagi/core/forms/form.py +791 -0
  31. lionagi/core/forms/report.py +321 -0
  32. lionagi/core/forms/types.py +13 -0
  33. lionagi/core/forms/utils.py +26 -0
  34. lionagi/core/generic/__init__.py +3 -6
  35. lionagi/core/generic/component.py +422 -0
  36. lionagi/core/generic/edge.py +143 -101
  37. lionagi/core/generic/element.py +195 -0
  38. lionagi/core/generic/graph.py +297 -180
  39. lionagi/core/generic/log.py +151 -0
  40. lionagi/core/generic/log_manager.py +320 -0
  41. lionagi/core/generic/node.py +7 -229
  42. lionagi/core/generic/pile.py +1017 -0
  43. lionagi/core/generic/progression.py +388 -0
  44. lionagi/core/generic/types.py +23 -0
  45. lionagi/core/generic/utils.py +50 -0
  46. lionagi/core/models/__init__.py +5 -0
  47. lionagi/core/models/base.py +85 -0
  48. lionagi/core/models/field_model.py +122 -0
  49. lionagi/core/models/new_model_params.py +195 -0
  50. lionagi/core/models/note.py +351 -0
  51. lionagi/core/models/operable_model.py +392 -0
  52. lionagi/core/models/schema_model.py +50 -0
  53. lionagi/core/models/types.py +10 -0
  54. lionagi/core/session/__init__.py +3 -0
  55. lionagi/core/session/branch.py +115 -415
  56. lionagi/core/session/branch_mixins.py +507 -0
  57. lionagi/core/session/session.py +122 -257
  58. lionagi/core/session/types.py +8 -0
  59. lionagi/core/typing/__init__.py +9 -0
  60. lionagi/core/typing/concepts.py +132 -0
  61. lionagi/core/typing/config.py +15 -0
  62. lionagi/core/typing/id.py +221 -0
  63. lionagi/core/typing/pydantic_.py +33 -0
  64. lionagi/core/typing/typing_.py +54 -0
  65. lionagi/integrations/__init__.py +0 -1
  66. lionagi/integrations/anthropic_/AnthropicModel.py +268 -0
  67. lionagi/integrations/anthropic_/AnthropicService.py +113 -0
  68. lionagi/integrations/anthropic_/__init__.py +3 -0
  69. lionagi/integrations/anthropic_/anthropic_max_output_token_data.yaml +7 -0
  70. lionagi/integrations/anthropic_/anthropic_price_data.yaml +14 -0
  71. lionagi/integrations/anthropic_/api_endpoints/__init__.py +3 -0
  72. lionagi/integrations/anthropic_/api_endpoints/api_request.py +277 -0
  73. lionagi/integrations/anthropic_/api_endpoints/data_models.py +40 -0
  74. lionagi/integrations/anthropic_/api_endpoints/match_response.py +119 -0
  75. lionagi/integrations/anthropic_/api_endpoints/messages/__init__.py +3 -0
  76. lionagi/integrations/anthropic_/api_endpoints/messages/request/__init__.py +3 -0
  77. lionagi/integrations/anthropic_/api_endpoints/messages/request/message_models.py +14 -0
  78. lionagi/integrations/anthropic_/api_endpoints/messages/request/request_body.py +74 -0
  79. lionagi/integrations/anthropic_/api_endpoints/messages/response/content_models.py +32 -0
  80. lionagi/integrations/anthropic_/api_endpoints/messages/response/response_body.py +101 -0
  81. lionagi/integrations/anthropic_/api_endpoints/messages/response/usage_models.py +25 -0
  82. lionagi/integrations/anthropic_/version.py +5 -0
  83. lionagi/integrations/groq_/GroqModel.py +318 -0
  84. lionagi/integrations/groq_/GroqService.py +147 -0
  85. lionagi/integrations/groq_/__init__.py +3 -0
  86. lionagi/integrations/groq_/api_endpoints/data_models.py +187 -0
  87. lionagi/integrations/groq_/api_endpoints/groq_request.py +288 -0
  88. lionagi/integrations/groq_/api_endpoints/match_response.py +106 -0
  89. lionagi/integrations/groq_/api_endpoints/response_utils.py +105 -0
  90. lionagi/integrations/groq_/groq_max_output_token_data.yaml +21 -0
  91. lionagi/integrations/groq_/groq_price_data.yaml +58 -0
  92. lionagi/integrations/groq_/groq_rate_limits.yaml +105 -0
  93. lionagi/integrations/groq_/version.py +5 -0
  94. lionagi/integrations/litellm_/__init__.py +3 -0
  95. lionagi/integrations/litellm_/imodel.py +69 -0
  96. lionagi/integrations/ollama_/OllamaModel.py +244 -0
  97. lionagi/integrations/ollama_/OllamaService.py +138 -0
  98. lionagi/integrations/ollama_/__init__.py +3 -0
  99. lionagi/integrations/ollama_/api_endpoints/__init__.py +3 -0
  100. lionagi/integrations/ollama_/api_endpoints/api_request.py +179 -0
  101. lionagi/integrations/ollama_/api_endpoints/chat_completion/__init__.py +3 -0
  102. lionagi/integrations/ollama_/api_endpoints/chat_completion/message_models.py +31 -0
  103. lionagi/integrations/ollama_/api_endpoints/chat_completion/request_body.py +46 -0
  104. lionagi/integrations/ollama_/api_endpoints/chat_completion/response_body.py +67 -0
  105. lionagi/integrations/ollama_/api_endpoints/chat_completion/tool_models.py +49 -0
  106. lionagi/integrations/ollama_/api_endpoints/completion/request_body.py +72 -0
  107. lionagi/integrations/ollama_/api_endpoints/completion/response_body.py +59 -0
  108. lionagi/integrations/ollama_/api_endpoints/data_models.py +15 -0
  109. lionagi/integrations/ollama_/api_endpoints/embedding/request_body.py +33 -0
  110. lionagi/integrations/ollama_/api_endpoints/embedding/response_body.py +29 -0
  111. lionagi/integrations/ollama_/api_endpoints/match_data_model.py +62 -0
  112. lionagi/integrations/ollama_/api_endpoints/match_response.py +190 -0
  113. lionagi/integrations/ollama_/api_endpoints/model/__init__.py +3 -0
  114. lionagi/integrations/ollama_/api_endpoints/model/copy_model.py +13 -0
  115. lionagi/integrations/ollama_/api_endpoints/model/create_model.py +28 -0
  116. lionagi/integrations/ollama_/api_endpoints/model/delete_model.py +11 -0
  117. lionagi/integrations/ollama_/api_endpoints/model/list_model.py +60 -0
  118. lionagi/integrations/ollama_/api_endpoints/model/pull_model.py +34 -0
  119. lionagi/integrations/ollama_/api_endpoints/model/push_model.py +35 -0
  120. lionagi/integrations/ollama_/api_endpoints/model/show_model.py +36 -0
  121. lionagi/integrations/ollama_/api_endpoints/option_models.py +68 -0
  122. lionagi/integrations/openai_/OpenAIModel.py +414 -0
  123. lionagi/integrations/openai_/OpenAIService.py +426 -0
  124. lionagi/integrations/openai_/api_endpoints/__init__.py +3 -0
  125. lionagi/integrations/openai_/api_endpoints/api_request.py +277 -0
  126. lionagi/integrations/openai_/api_endpoints/audio/__init__.py +9 -0
  127. lionagi/integrations/openai_/api_endpoints/audio/speech_models.py +34 -0
  128. lionagi/integrations/openai_/api_endpoints/audio/transcription_models.py +136 -0
  129. lionagi/integrations/openai_/api_endpoints/audio/translation_models.py +41 -0
  130. lionagi/integrations/openai_/api_endpoints/audio/types.py +41 -0
  131. lionagi/integrations/openai_/api_endpoints/batch/__init__.py +17 -0
  132. lionagi/integrations/openai_/api_endpoints/batch/batch_models.py +146 -0
  133. lionagi/integrations/openai_/api_endpoints/batch/cancel_batch.py +7 -0
  134. lionagi/integrations/openai_/api_endpoints/batch/create_batch.py +26 -0
  135. lionagi/integrations/openai_/api_endpoints/batch/list_batch.py +37 -0
  136. lionagi/integrations/openai_/api_endpoints/batch/request_object_models.py +65 -0
  137. lionagi/integrations/openai_/api_endpoints/batch/retrieve_batch.py +7 -0
  138. lionagi/integrations/openai_/api_endpoints/batch/types.py +4 -0
  139. lionagi/integrations/openai_/api_endpoints/chat_completions/__init__.py +1 -0
  140. lionagi/integrations/openai_/api_endpoints/chat_completions/request/__init__.py +39 -0
  141. lionagi/integrations/openai_/api_endpoints/chat_completions/request/message_models.py +121 -0
  142. lionagi/integrations/openai_/api_endpoints/chat_completions/request/request_body.py +221 -0
  143. lionagi/integrations/openai_/api_endpoints/chat_completions/request/response_format.py +71 -0
  144. lionagi/integrations/openai_/api_endpoints/chat_completions/request/stream_options.py +14 -0
  145. lionagi/integrations/openai_/api_endpoints/chat_completions/request/tool_choice_models.py +17 -0
  146. lionagi/integrations/openai_/api_endpoints/chat_completions/request/tool_models.py +54 -0
  147. lionagi/integrations/openai_/api_endpoints/chat_completions/request/types.py +18 -0
  148. lionagi/integrations/openai_/api_endpoints/chat_completions/response/choice_models.py +62 -0
  149. lionagi/integrations/openai_/api_endpoints/chat_completions/response/function_models.py +16 -0
  150. lionagi/integrations/openai_/api_endpoints/chat_completions/response/log_prob_models.py +47 -0
  151. lionagi/integrations/openai_/api_endpoints/chat_completions/response/message_models.py +25 -0
  152. lionagi/integrations/openai_/api_endpoints/chat_completions/response/response_body.py +99 -0
  153. lionagi/integrations/openai_/api_endpoints/chat_completions/response/types.py +8 -0
  154. lionagi/integrations/openai_/api_endpoints/chat_completions/response/usage_models.py +24 -0
  155. lionagi/integrations/openai_/api_endpoints/chat_completions/util.py +46 -0
  156. lionagi/integrations/openai_/api_endpoints/data_models.py +23 -0
  157. lionagi/integrations/openai_/api_endpoints/embeddings/__init__.py +3 -0
  158. lionagi/integrations/openai_/api_endpoints/embeddings/request_body.py +79 -0
  159. lionagi/integrations/openai_/api_endpoints/embeddings/response_body.py +67 -0
  160. lionagi/integrations/openai_/api_endpoints/files/__init__.py +11 -0
  161. lionagi/integrations/openai_/api_endpoints/files/delete_file.py +20 -0
  162. lionagi/integrations/openai_/api_endpoints/files/file_models.py +56 -0
  163. lionagi/integrations/openai_/api_endpoints/files/list_files.py +27 -0
  164. lionagi/integrations/openai_/api_endpoints/files/retrieve_file.py +9 -0
  165. lionagi/integrations/openai_/api_endpoints/files/upload_file.py +38 -0
  166. lionagi/integrations/openai_/api_endpoints/fine_tuning/__init__.py +37 -0
  167. lionagi/integrations/openai_/api_endpoints/fine_tuning/cancel_jobs.py +9 -0
  168. lionagi/integrations/openai_/api_endpoints/fine_tuning/create_jobs.py +133 -0
  169. lionagi/integrations/openai_/api_endpoints/fine_tuning/fine_tuning_job_checkpoint_models.py +58 -0
  170. lionagi/integrations/openai_/api_endpoints/fine_tuning/fine_tuning_job_event_models.py +31 -0
  171. lionagi/integrations/openai_/api_endpoints/fine_tuning/fine_tuning_job_models.py +140 -0
  172. lionagi/integrations/openai_/api_endpoints/fine_tuning/list_fine_tuning_checkpoints.py +51 -0
  173. lionagi/integrations/openai_/api_endpoints/fine_tuning/list_fine_tuning_events.py +42 -0
  174. lionagi/integrations/openai_/api_endpoints/fine_tuning/list_fine_tuning_jobs.py +31 -0
  175. lionagi/integrations/openai_/api_endpoints/fine_tuning/retrieve_jobs.py +9 -0
  176. lionagi/integrations/openai_/api_endpoints/fine_tuning/training_format.py +30 -0
  177. lionagi/integrations/openai_/api_endpoints/images/__init__.py +9 -0
  178. lionagi/integrations/openai_/api_endpoints/images/image_edit_models.py +69 -0
  179. lionagi/integrations/openai_/api_endpoints/images/image_models.py +56 -0
  180. lionagi/integrations/openai_/api_endpoints/images/image_variation_models.py +56 -0
  181. lionagi/integrations/openai_/api_endpoints/images/response_body.py +30 -0
  182. lionagi/integrations/openai_/api_endpoints/match_data_model.py +197 -0
  183. lionagi/integrations/openai_/api_endpoints/match_response.py +336 -0
  184. lionagi/integrations/openai_/api_endpoints/models/__init__.py +7 -0
  185. lionagi/integrations/openai_/api_endpoints/models/delete_fine_tuned_model.py +17 -0
  186. lionagi/integrations/openai_/api_endpoints/models/models_models.py +31 -0
  187. lionagi/integrations/openai_/api_endpoints/models/retrieve_model.py +9 -0
  188. lionagi/integrations/openai_/api_endpoints/moderations/__init__.py +3 -0
  189. lionagi/integrations/openai_/api_endpoints/moderations/request_body.py +20 -0
  190. lionagi/integrations/openai_/api_endpoints/moderations/response_body.py +139 -0
  191. lionagi/integrations/openai_/api_endpoints/uploads/__init__.py +19 -0
  192. lionagi/integrations/openai_/api_endpoints/uploads/add_upload_part.py +11 -0
  193. lionagi/integrations/openai_/api_endpoints/uploads/cancel_upload.py +7 -0
  194. lionagi/integrations/openai_/api_endpoints/uploads/complete_upload.py +18 -0
  195. lionagi/integrations/openai_/api_endpoints/uploads/create_upload.py +17 -0
  196. lionagi/integrations/openai_/api_endpoints/uploads/uploads_models.py +52 -0
  197. lionagi/integrations/openai_/image_token_calculator/image_token_calculator.py +92 -0
  198. lionagi/integrations/openai_/image_token_calculator/openai_image_token_data.yaml +15 -0
  199. lionagi/integrations/openai_/openai_max_output_token_data.yaml +12 -0
  200. lionagi/integrations/openai_/openai_price_data.yaml +26 -0
  201. lionagi/integrations/openai_/version.py +1 -0
  202. lionagi/integrations/pandas_/__init__.py +24 -0
  203. lionagi/integrations/pandas_/extend_df.py +61 -0
  204. lionagi/integrations/pandas_/read.py +103 -0
  205. lionagi/integrations/pandas_/remove_rows.py +61 -0
  206. lionagi/integrations/pandas_/replace_keywords.py +65 -0
  207. lionagi/integrations/pandas_/save.py +131 -0
  208. lionagi/integrations/pandas_/search_keywords.py +69 -0
  209. lionagi/integrations/pandas_/to_df.py +196 -0
  210. lionagi/integrations/pandas_/update_cells.py +54 -0
  211. lionagi/integrations/perplexity_/PerplexityModel.py +269 -0
  212. lionagi/integrations/perplexity_/PerplexityService.py +109 -0
  213. lionagi/integrations/perplexity_/__init__.py +3 -0
  214. lionagi/integrations/perplexity_/api_endpoints/api_request.py +171 -0
  215. lionagi/integrations/perplexity_/api_endpoints/chat_completions/request/request_body.py +121 -0
  216. lionagi/integrations/perplexity_/api_endpoints/chat_completions/response/response_body.py +146 -0
  217. lionagi/integrations/perplexity_/api_endpoints/data_models.py +63 -0
  218. lionagi/integrations/perplexity_/api_endpoints/match_response.py +26 -0
  219. lionagi/integrations/perplexity_/perplexity_max_output_token_data.yaml +3 -0
  220. lionagi/integrations/perplexity_/perplexity_price_data.yaml +10 -0
  221. lionagi/integrations/perplexity_/version.py +1 -0
  222. lionagi/integrations/pydantic_/__init__.py +8 -0
  223. lionagi/integrations/pydantic_/break_down_annotation.py +81 -0
  224. lionagi/integrations/pydantic_/new_model.py +208 -0
  225. lionagi/integrations/services.py +17 -0
  226. lionagi/libs/__init__.py +0 -55
  227. lionagi/libs/compress/models.py +62 -0
  228. lionagi/libs/compress/utils.py +81 -0
  229. lionagi/libs/constants.py +98 -0
  230. lionagi/libs/file/chunk.py +265 -0
  231. lionagi/libs/file/file_ops.py +114 -0
  232. lionagi/libs/file/params.py +212 -0
  233. lionagi/libs/file/path.py +301 -0
  234. lionagi/libs/file/process.py +139 -0
  235. lionagi/libs/file/save.py +90 -0
  236. lionagi/libs/file/types.py +22 -0
  237. lionagi/libs/func/async_calls/__init__.py +21 -0
  238. lionagi/libs/func/async_calls/alcall.py +157 -0
  239. lionagi/libs/func/async_calls/bcall.py +82 -0
  240. lionagi/libs/func/async_calls/mcall.py +134 -0
  241. lionagi/libs/func/async_calls/pcall.py +149 -0
  242. lionagi/libs/func/async_calls/rcall.py +185 -0
  243. lionagi/libs/func/async_calls/tcall.py +114 -0
  244. lionagi/libs/func/async_calls/ucall.py +85 -0
  245. lionagi/libs/func/decorators.py +277 -0
  246. lionagi/libs/func/lcall.py +57 -0
  247. lionagi/libs/func/params.py +64 -0
  248. lionagi/libs/func/throttle.py +119 -0
  249. lionagi/libs/func/types.py +39 -0
  250. lionagi/libs/func/utils.py +96 -0
  251. lionagi/libs/package/imports.py +162 -0
  252. lionagi/libs/package/management.py +58 -0
  253. lionagi/libs/package/params.py +26 -0
  254. lionagi/libs/package/system.py +18 -0
  255. lionagi/libs/package/types.py +26 -0
  256. lionagi/libs/parse/__init__.py +1 -0
  257. lionagi/libs/parse/flatten/__init__.py +9 -0
  258. lionagi/libs/parse/flatten/flatten.py +168 -0
  259. lionagi/libs/parse/flatten/params.py +52 -0
  260. lionagi/libs/parse/flatten/unflatten.py +79 -0
  261. lionagi/libs/parse/json/__init__.py +27 -0
  262. lionagi/libs/parse/json/as_readable.py +104 -0
  263. lionagi/libs/parse/json/extract.py +102 -0
  264. lionagi/libs/parse/json/parse.py +179 -0
  265. lionagi/libs/parse/json/schema.py +227 -0
  266. lionagi/libs/parse/json/to_json.py +71 -0
  267. lionagi/libs/parse/nested/__init__.py +33 -0
  268. lionagi/libs/parse/nested/nfilter.py +55 -0
  269. lionagi/libs/parse/nested/nget.py +40 -0
  270. lionagi/libs/parse/nested/ninsert.py +103 -0
  271. lionagi/libs/parse/nested/nmerge.py +155 -0
  272. lionagi/libs/parse/nested/npop.py +66 -0
  273. lionagi/libs/parse/nested/nset.py +89 -0
  274. lionagi/libs/parse/nested/to_flat_list.py +64 -0
  275. lionagi/libs/parse/nested/utils.py +185 -0
  276. lionagi/libs/parse/string_parse/__init__.py +11 -0
  277. lionagi/libs/parse/string_parse/code_block.py +73 -0
  278. lionagi/libs/parse/string_parse/docstring.py +179 -0
  279. lionagi/libs/parse/string_parse/function_.py +92 -0
  280. lionagi/libs/parse/type_convert/__init__.py +19 -0
  281. lionagi/libs/parse/type_convert/params.py +145 -0
  282. lionagi/libs/parse/type_convert/to_dict.py +333 -0
  283. lionagi/libs/parse/type_convert/to_list.py +186 -0
  284. lionagi/libs/parse/type_convert/to_num.py +358 -0
  285. lionagi/libs/parse/type_convert/to_str.py +195 -0
  286. lionagi/libs/parse/types.py +9 -0
  287. lionagi/libs/parse/validate/__init__.py +14 -0
  288. lionagi/libs/parse/validate/boolean.py +96 -0
  289. lionagi/libs/parse/validate/keys.py +150 -0
  290. lionagi/libs/parse/validate/mapping.py +109 -0
  291. lionagi/libs/parse/validate/params.py +62 -0
  292. lionagi/libs/parse/xml/__init__.py +10 -0
  293. lionagi/libs/parse/xml/convert.py +56 -0
  294. lionagi/libs/parse/xml/parser.py +93 -0
  295. lionagi/libs/string_similarity/__init__.py +32 -0
  296. lionagi/libs/string_similarity/algorithms.py +219 -0
  297. lionagi/libs/string_similarity/matcher.py +102 -0
  298. lionagi/libs/string_similarity/utils.py +15 -0
  299. lionagi/libs/utils.py +255 -0
  300. lionagi/operations/__init__.py +3 -6
  301. lionagi/operations/brainstorm/__init__.py +3 -0
  302. lionagi/operations/brainstorm/brainstorm.py +204 -0
  303. lionagi/operations/brainstorm/prompt.py +1 -0
  304. lionagi/operations/plan/__init__.py +3 -0
  305. lionagi/operations/plan/plan.py +172 -0
  306. lionagi/operations/plan/prompt.py +21 -0
  307. lionagi/operations/select/__init__.py +3 -0
  308. lionagi/operations/select/prompt.py +1 -0
  309. lionagi/operations/select/select.py +100 -0
  310. lionagi/operations/select/utils.py +107 -0
  311. lionagi/operations/utils.py +35 -0
  312. lionagi/protocols/adapters/adapter.py +79 -0
  313. lionagi/protocols/adapters/json_adapter.py +43 -0
  314. lionagi/protocols/adapters/pandas_adapter.py +96 -0
  315. lionagi/protocols/configs/__init__.py +15 -0
  316. lionagi/protocols/configs/branch_config.py +86 -0
  317. lionagi/protocols/configs/id_config.py +15 -0
  318. lionagi/protocols/configs/imodel_config.py +73 -0
  319. lionagi/protocols/configs/log_config.py +93 -0
  320. lionagi/protocols/configs/retry_config.py +29 -0
  321. lionagi/protocols/operatives/__init__.py +15 -0
  322. lionagi/protocols/operatives/action.py +181 -0
  323. lionagi/protocols/operatives/instruct.py +196 -0
  324. lionagi/protocols/operatives/operative.py +182 -0
  325. lionagi/protocols/operatives/prompts.py +232 -0
  326. lionagi/protocols/operatives/reason.py +56 -0
  327. lionagi/protocols/operatives/step.py +217 -0
  328. lionagi/protocols/registries/_component_registry.py +19 -0
  329. lionagi/protocols/registries/_pile_registry.py +26 -0
  330. lionagi/service/__init__.py +13 -0
  331. lionagi/service/complete_request_info.py +11 -0
  332. lionagi/service/imodel.py +110 -0
  333. lionagi/service/rate_limiter.py +108 -0
  334. lionagi/service/service.py +37 -0
  335. lionagi/service/service_match_util.py +131 -0
  336. lionagi/service/service_util.py +72 -0
  337. lionagi/service/token_calculator.py +51 -0
  338. lionagi/settings.py +136 -0
  339. lionagi/strategies/base.py +53 -0
  340. lionagi/strategies/concurrent.py +71 -0
  341. lionagi/strategies/concurrent_chunk.py +43 -0
  342. lionagi/strategies/concurrent_sequential_chunk.py +104 -0
  343. lionagi/strategies/params.py +128 -0
  344. lionagi/strategies/sequential.py +23 -0
  345. lionagi/strategies/sequential_chunk.py +89 -0
  346. lionagi/strategies/sequential_concurrent_chunk.py +100 -0
  347. lionagi/strategies/types.py +21 -0
  348. lionagi/strategies/utils.py +49 -0
  349. lionagi/version.py +1 -1
  350. lionagi-0.5.0.dist-info/METADATA +348 -0
  351. lionagi-0.5.0.dist-info/RECORD +373 -0
  352. {lionagi-0.4.0.dist-info → lionagi-0.5.0.dist-info}/WHEEL +1 -1
  353. lionagi/core/_setting/_setting.py +0 -59
  354. lionagi/core/action/README.md +0 -20
  355. lionagi/core/action/manual.py +0 -1
  356. lionagi/core/action/node.py +0 -94
  357. lionagi/core/action/tool_manager.py +0 -342
  358. lionagi/core/agent/README.md +0 -1
  359. lionagi/core/agent/base_agent.py +0 -82
  360. lionagi/core/agent/eval/README.md +0 -1
  361. lionagi/core/agent/eval/evaluator.py +0 -1
  362. lionagi/core/agent/eval/vote.py +0 -40
  363. lionagi/core/agent/learn/learner.py +0 -59
  364. lionagi/core/agent/plan/unit_template.py +0 -1
  365. lionagi/core/collections/README.md +0 -23
  366. lionagi/core/collections/__init__.py +0 -16
  367. lionagi/core/collections/_logger.py +0 -312
  368. lionagi/core/collections/abc/README.md +0 -63
  369. lionagi/core/collections/abc/__init__.py +0 -53
  370. lionagi/core/collections/abc/component.py +0 -620
  371. lionagi/core/collections/abc/concepts.py +0 -277
  372. lionagi/core/collections/abc/exceptions.py +0 -136
  373. lionagi/core/collections/abc/util.py +0 -45
  374. lionagi/core/collections/exchange.py +0 -146
  375. lionagi/core/collections/flow.py +0 -416
  376. lionagi/core/collections/model.py +0 -465
  377. lionagi/core/collections/pile.py +0 -1232
  378. lionagi/core/collections/progression.py +0 -221
  379. lionagi/core/collections/util.py +0 -73
  380. lionagi/core/director/README.md +0 -1
  381. lionagi/core/director/direct.py +0 -298
  382. lionagi/core/director/director.py +0 -2
  383. lionagi/core/director/operations/select.py +0 -3
  384. lionagi/core/director/operations/utils.py +0 -6
  385. lionagi/core/engine/branch_engine.py +0 -361
  386. lionagi/core/engine/instruction_map_engine.py +0 -213
  387. lionagi/core/engine/sandbox_.py +0 -16
  388. lionagi/core/engine/script_engine.py +0 -89
  389. lionagi/core/executor/base_executor.py +0 -97
  390. lionagi/core/executor/graph_executor.py +0 -335
  391. lionagi/core/executor/neo4j_executor.py +0 -394
  392. lionagi/core/generic/README.md +0 -0
  393. lionagi/core/generic/edge_condition.py +0 -17
  394. lionagi/core/generic/hyperedge.py +0 -1
  395. lionagi/core/generic/tree.py +0 -49
  396. lionagi/core/generic/tree_node.py +0 -85
  397. lionagi/core/mail/__init__.py +0 -11
  398. lionagi/core/mail/mail.py +0 -26
  399. lionagi/core/mail/mail_manager.py +0 -185
  400. lionagi/core/mail/package.py +0 -49
  401. lionagi/core/mail/start_mail.py +0 -36
  402. lionagi/core/message/__init__.py +0 -18
  403. lionagi/core/message/action_request.py +0 -114
  404. lionagi/core/message/action_response.py +0 -121
  405. lionagi/core/message/assistant_response.py +0 -80
  406. lionagi/core/message/instruction.py +0 -194
  407. lionagi/core/message/message.py +0 -86
  408. lionagi/core/message/system.py +0 -71
  409. lionagi/core/message/util.py +0 -274
  410. lionagi/core/report/__init__.py +0 -4
  411. lionagi/core/report/base.py +0 -201
  412. lionagi/core/report/form.py +0 -212
  413. lionagi/core/report/report.py +0 -150
  414. lionagi/core/report/util.py +0 -15
  415. lionagi/core/rule/_default.py +0 -17
  416. lionagi/core/rule/action.py +0 -87
  417. lionagi/core/rule/base.py +0 -234
  418. lionagi/core/rule/boolean.py +0 -56
  419. lionagi/core/rule/choice.py +0 -48
  420. lionagi/core/rule/mapping.py +0 -82
  421. lionagi/core/rule/number.py +0 -73
  422. lionagi/core/rule/rulebook.py +0 -45
  423. lionagi/core/rule/string.py +0 -43
  424. lionagi/core/rule/util.py +0 -0
  425. lionagi/core/session/directive_mixin.py +0 -307
  426. lionagi/core/structure/__init__.py +0 -1
  427. lionagi/core/structure/chain.py +0 -1
  428. lionagi/core/structure/forest.py +0 -1
  429. lionagi/core/structure/graph.py +0 -1
  430. lionagi/core/structure/tree.py +0 -1
  431. lionagi/core/unit/__init__.py +0 -4
  432. lionagi/core/unit/parallel_unit.py +0 -234
  433. lionagi/core/unit/template/action.py +0 -65
  434. lionagi/core/unit/template/base.py +0 -35
  435. lionagi/core/unit/template/plan.py +0 -69
  436. lionagi/core/unit/template/predict.py +0 -95
  437. lionagi/core/unit/template/score.py +0 -108
  438. lionagi/core/unit/template/select.py +0 -91
  439. lionagi/core/unit/unit.py +0 -452
  440. lionagi/core/unit/unit_form.py +0 -290
  441. lionagi/core/unit/unit_mixin.py +0 -1166
  442. lionagi/core/unit/util.py +0 -103
  443. lionagi/core/validator/validator.py +0 -376
  444. lionagi/core/work/work.py +0 -59
  445. lionagi/core/work/work_edge.py +0 -102
  446. lionagi/core/work/work_function.py +0 -114
  447. lionagi/core/work/work_function_node.py +0 -50
  448. lionagi/core/work/work_queue.py +0 -90
  449. lionagi/core/work/work_task.py +0 -151
  450. lionagi/core/work/worker.py +0 -410
  451. lionagi/core/work/worker_engine.py +0 -208
  452. lionagi/core/work/worklog.py +0 -108
  453. lionagi/experimental/compressor/base.py +0 -47
  454. lionagi/experimental/compressor/llm_compressor.py +0 -265
  455. lionagi/experimental/compressor/llm_summarizer.py +0 -61
  456. lionagi/experimental/compressor/util.py +0 -70
  457. lionagi/experimental/directive/README.md +0 -1
  458. lionagi/experimental/directive/__init__.py +0 -19
  459. lionagi/experimental/directive/parser/base_parser.py +0 -294
  460. lionagi/experimental/directive/parser/base_syntax.txt +0 -200
  461. lionagi/experimental/directive/template/base_template.py +0 -71
  462. lionagi/experimental/directive/template/schema.py +0 -36
  463. lionagi/experimental/directive/tokenizer.py +0 -59
  464. lionagi/experimental/evaluator/README.md +0 -1
  465. lionagi/experimental/evaluator/ast_evaluator.py +0 -119
  466. lionagi/experimental/evaluator/base_evaluator.py +0 -213
  467. lionagi/experimental/knowledge/__init__.py +0 -0
  468. lionagi/experimental/knowledge/base.py +0 -10
  469. lionagi/experimental/knowledge/graph.py +0 -0
  470. lionagi/experimental/memory/__init__.py +0 -0
  471. lionagi/experimental/strategies/__init__.py +0 -0
  472. lionagi/experimental/strategies/base.py +0 -1
  473. lionagi/integrations/bridge/__init__.py +0 -4
  474. lionagi/integrations/bridge/autogen_/__init__.py +0 -0
  475. lionagi/integrations/bridge/autogen_/autogen_.py +0 -127
  476. lionagi/integrations/bridge/langchain_/__init__.py +0 -0
  477. lionagi/integrations/bridge/langchain_/documents.py +0 -138
  478. lionagi/integrations/bridge/langchain_/langchain_bridge.py +0 -68
  479. lionagi/integrations/bridge/llamaindex_/__init__.py +0 -0
  480. lionagi/integrations/bridge/llamaindex_/index.py +0 -36
  481. lionagi/integrations/bridge/llamaindex_/llama_index_bridge.py +0 -108
  482. lionagi/integrations/bridge/llamaindex_/llama_pack.py +0 -256
  483. lionagi/integrations/bridge/llamaindex_/node_parser.py +0 -92
  484. lionagi/integrations/bridge/llamaindex_/reader.py +0 -201
  485. lionagi/integrations/bridge/llamaindex_/textnode.py +0 -59
  486. lionagi/integrations/bridge/pydantic_/__init__.py +0 -0
  487. lionagi/integrations/bridge/pydantic_/pydantic_bridge.py +0 -7
  488. lionagi/integrations/bridge/transformers_/__init__.py +0 -0
  489. lionagi/integrations/bridge/transformers_/install_.py +0 -39
  490. lionagi/integrations/chunker/__init__.py +0 -0
  491. lionagi/integrations/chunker/chunk.py +0 -314
  492. lionagi/integrations/config/__init__.py +0 -4
  493. lionagi/integrations/config/mlx_configs.py +0 -1
  494. lionagi/integrations/config/oai_configs.py +0 -154
  495. lionagi/integrations/config/ollama_configs.py +0 -1
  496. lionagi/integrations/config/openrouter_configs.py +0 -74
  497. lionagi/integrations/langchain_/__init__.py +0 -0
  498. lionagi/integrations/llamaindex_/__init__.py +0 -0
  499. lionagi/integrations/loader/__init__.py +0 -0
  500. lionagi/integrations/loader/load.py +0 -257
  501. lionagi/integrations/loader/load_util.py +0 -214
  502. lionagi/integrations/provider/__init__.py +0 -11
  503. lionagi/integrations/provider/_mapping.py +0 -47
  504. lionagi/integrations/provider/litellm.py +0 -53
  505. lionagi/integrations/provider/mistralai.py +0 -1
  506. lionagi/integrations/provider/mlx_service.py +0 -55
  507. lionagi/integrations/provider/oai.py +0 -196
  508. lionagi/integrations/provider/ollama.py +0 -55
  509. lionagi/integrations/provider/openrouter.py +0 -170
  510. lionagi/integrations/provider/services.py +0 -138
  511. lionagi/integrations/provider/transformers.py +0 -108
  512. lionagi/integrations/storage/__init__.py +0 -3
  513. lionagi/integrations/storage/neo4j.py +0 -681
  514. lionagi/integrations/storage/storage_util.py +0 -302
  515. lionagi/integrations/storage/structure_excel.py +0 -291
  516. lionagi/integrations/storage/to_csv.py +0 -70
  517. lionagi/integrations/storage/to_excel.py +0 -91
  518. lionagi/libs/ln_api.py +0 -944
  519. lionagi/libs/ln_async.py +0 -208
  520. lionagi/libs/ln_context.py +0 -37
  521. lionagi/libs/ln_convert.py +0 -671
  522. lionagi/libs/ln_dataframe.py +0 -187
  523. lionagi/libs/ln_func_call.py +0 -1328
  524. lionagi/libs/ln_image.py +0 -114
  525. lionagi/libs/ln_knowledge_graph.py +0 -422
  526. lionagi/libs/ln_nested.py +0 -822
  527. lionagi/libs/ln_parse.py +0 -750
  528. lionagi/libs/ln_queue.py +0 -107
  529. lionagi/libs/ln_tokenize.py +0 -179
  530. lionagi/libs/ln_validate.py +0 -299
  531. lionagi/libs/special_tokens.py +0 -172
  532. lionagi/libs/sys_util.py +0 -710
  533. lionagi/lions/__init__.py +0 -0
  534. lionagi/lions/coder/__init__.py +0 -0
  535. lionagi/lions/coder/add_feature.py +0 -20
  536. lionagi/lions/coder/base_prompts.py +0 -22
  537. lionagi/lions/coder/code_form.py +0 -15
  538. lionagi/lions/coder/coder.py +0 -184
  539. lionagi/lions/coder/util.py +0 -101
  540. lionagi/lions/director/__init__.py +0 -0
  541. lionagi/lions/judge/__init__.py +0 -0
  542. lionagi/lions/judge/config.py +0 -8
  543. lionagi/lions/judge/data/__init__.py +0 -0
  544. lionagi/lions/judge/data/sample_codes.py +0 -526
  545. lionagi/lions/judge/data/sample_rurbic.py +0 -48
  546. lionagi/lions/judge/forms/__init__.py +0 -0
  547. lionagi/lions/judge/forms/code_analysis_form.py +0 -126
  548. lionagi/lions/judge/rubric.py +0 -34
  549. lionagi/lions/judge/services/__init__.py +0 -0
  550. lionagi/lions/judge/services/judge_code.py +0 -49
  551. lionagi/lions/researcher/__init__.py +0 -0
  552. lionagi/lions/researcher/data_source/__init__.py +0 -0
  553. lionagi/lions/researcher/data_source/finhub_.py +0 -192
  554. lionagi/lions/researcher/data_source/google_.py +0 -207
  555. lionagi/lions/researcher/data_source/wiki_.py +0 -98
  556. lionagi/lions/researcher/data_source/yfinance_.py +0 -21
  557. lionagi/operations/brainstorm.py +0 -87
  558. lionagi/operations/config.py +0 -6
  559. lionagi/operations/rank.py +0 -102
  560. lionagi/operations/score.py +0 -144
  561. lionagi/operations/select.py +0 -141
  562. lionagi-0.4.0.dist-info/METADATA +0 -241
  563. lionagi-0.4.0.dist-info/RECORD +0 -249
  564. /lionagi/{core/_setting → integrations/anthropic_/api_endpoints/messages/response}/__init__.py +0 -0
  565. /lionagi/{core/agent → integrations/groq_/api_endpoints}/__init__.py +0 -0
  566. /lionagi/{core/agent/eval → integrations/ollama_/api_endpoints/completion}/__init__.py +0 -0
  567. /lionagi/{core/agent/learn → integrations/ollama_/api_endpoints/embedding}/__init__.py +0 -0
  568. /lionagi/{core/agent/plan → integrations/openai_}/__init__.py +0 -0
  569. /lionagi/{core/director → integrations/openai_/api_endpoints/chat_completions/response}/__init__.py +0 -0
  570. /lionagi/{core/director/operations → integrations/openai_/image_token_calculator}/__init__.py +0 -0
  571. /lionagi/{core/engine → integrations/perplexity_/api_endpoints}/__init__.py +0 -0
  572. /lionagi/{core/executor → integrations/perplexity_/api_endpoints/chat_completions}/__init__.py +0 -0
  573. /lionagi/{core/generic/registry/component_registry → integrations/perplexity_/api_endpoints/chat_completions/request}/__init__.py +0 -0
  574. /lionagi/{core/rule → integrations/perplexity_/api_endpoints/chat_completions/response}/__init__.py +0 -0
  575. /lionagi/{core/unit/template → libs/compress}/__init__.py +0 -0
  576. /lionagi/{core/validator → libs/file}/__init__.py +0 -0
  577. /lionagi/{core/work → libs/func}/__init__.py +0 -0
  578. /lionagi/{experimental → libs/package}/__init__.py +0 -0
  579. /lionagi/{core/agent/plan/plan.py → libs/parse/params.py} +0 -0
  580. /lionagi/{experimental/compressor → protocols}/__init__.py +0 -0
  581. /lionagi/{experimental/directive/parser → protocols/adapters}/__init__.py +0 -0
  582. /lionagi/{experimental/directive/template → protocols/registries}/__init__.py +0 -0
  583. /lionagi/{experimental/evaluator → strategies}/__init__.py +0 -0
  584. {lionagi-0.4.0.dist-info → lionagi-0.5.0.dist-info/licenses}/LICENSE +0 -0
@@ -0,0 +1,212 @@
1
+ from collections.abc import Callable
2
+ from pathlib import Path
3
+ from typing import Any, Literal
4
+
5
+ from pydantic import BaseModel, Field
6
+
7
+
8
class ChunkContentParams(BaseModel):
    """Parameters for chunking text content into smaller pieces.

    This model defines parameters used by the chunk_content function to split text
    content into chunks, with support for both character-based and token-based chunking.
    """

    # NOTE: pydantic surfaces the class docstring and every ``description``
    # in the generated JSON schema, so that text is part of the public
    # contract and is kept verbatim.

    # --- input ---------------------------------------------------------
    content: str = Field(description="The text content to be chunked")

    # --- splitting strategy --------------------------------------------
    chunk_by: Literal["chars", "tokens"] = Field(
        description="Method to use for chunking: 'chars' for character-based or 'tokens' for token-based",
        default="chars",
    )
    tokenizer: Callable[[str], list[str]] | None = Field(
        description="Function to use for tokenization. Defaults to str.split if None",
        default=None,
    )

    # --- sizing ---------------------------------------------------------
    chunk_size: int = Field(
        description="Target size for each chunk",
        default=1024,
        ge=1,
    )
    overlap: float = Field(
        description="Fraction of overlap between chunks (0.0 to 1.0)",
        default=0.0,
        ge=0.0,
        le=1.0,
    )
    threshold: int = Field(
        description="Minimum size threshold for the last chunk",
        default=256,
        ge=0,
    )

    # --- output shaping -------------------------------------------------
    metadata: dict[str, Any] = Field(
        description="Additional metadata to include with each chunk",
        default_factory=dict,
    )
    return_tokens: bool = Field(
        description="If True, return chunks as token lists; if False, return as joined strings",
        default=False,
    )
+
47
+
48
class CreatePathParams(BaseModel):
    """Parameters for creating file paths with various options.

    This model defines parameters used by the create_path function to generate
    file paths with support for timestamps, random hashes, and existence checks.
    """

    # NOTE: the docstring and ``description`` strings feed pydantic's JSON
    # schema output, so they are reproduced verbatim.

    # --- where and what -------------------------------------------------
    directory: Path | str = Field(
        description="Directory where the file will be created",
    )
    filename: str = Field(description="Base name of the file to create")
    extension: str | None = Field(
        description="File extension (with or without leading dot)",
        default=None,
    )

    # --- collision handling ---------------------------------------------
    timestamp: bool = Field(
        description="If True, adds a timestamp to the filename",
        default=False,
    )
    dir_exist_ok: bool = Field(
        description="If True, doesn't raise an error if the directory exists",
        default=True,
    )
    file_exist_ok: bool = Field(
        description="If True, allows overwriting of existing files",
        default=False,
    )

    # --- name decoration ------------------------------------------------
    time_prefix: bool = Field(
        description="If True, adds timestamp as prefix instead of suffix",
        default=False,
    )
    timestamp_format: str | None = Field(
        description="Custom format for the timestamp (strftime format)",
        default=None,
    )
    random_hash_digits: int = Field(
        description="Number of random hash digits to append to filename",
        default=0,
        ge=0,
    )
+
88
+
89
class DirToFilesParams(BaseModel):
    """Parameters for processing directories and collecting file paths.

    This model defines parameters used by the dir_to_files function to recursively
    process directories and collect matching file paths.
    """

    # Root of the recursive walk.
    directory: Path | str = Field(
        description="Directory to process recursively"
    )
    # Suffix allow-list; None disables filtering.
    file_types: list[str] | None = Field(
        default=None,
        description="List of file extensions to include (e.g., ['.txt', '.pdf']). If None, includes all types",
    )
    # ThreadPoolExecutor rejects a worker count below 1, so validate it here
    # rather than failing later when the pool is created. None still means
    # "use the executor's default".
    max_workers: int | None = Field(
        default=None,
        ge=1,
        description="Maximum number of worker threads for concurrent processing",
    )
    # Error-handling and logging switches.
    ignore_errors: bool = Field(
        default=False,
        description="If True, log warnings for errors instead of raising exceptions",
    )
    verbose: bool = Field(
        default=False,
        description="If True, print verbose output during processing",
    )
+
116
+
117
class FileToChunksParams(BaseModel):
    """Parameters for splitting file content into chunks.

    This model defines parameters used by the file_to_chunks function to read
    and split file content into chunks with metadata.
    """

    # NOTE: the docstring and ``description`` strings feed pydantic's JSON
    # schema output, so they are reproduced verbatim.

    # --- source ---------------------------------------------------------
    file_path: Path | str = Field(
        description="Path to the file to be processed",
    )
    encoding: str = Field(
        description="File encoding to use when reading the file",
        default="utf-8",
    )

    # --- chunking -------------------------------------------------------
    chunk_func: Callable[[str, int, float, int], list[str]] = Field(
        description="Function to use for chunking the content",
    )
    chunk_size: int = Field(
        description="Target size for each chunk",
        default=1500,
        ge=1,
    )
    overlap: float = Field(
        description="Fraction of overlap between chunks (0.0 to 1.0)",
        default=0.1,
        ge=0.0,
        le=1.0,
    )
    threshold: int = Field(
        description="Minimum size threshold for the last chunk",
        default=200,
        ge=0,
    )
    custom_metadata: dict[str, Any] | None = Field(
        description="Additional metadata to include with each chunk",
        default=None,
    )

    # --- optional persistence -------------------------------------------
    output_dir: Path | str | None = Field(
        description="Directory to save output chunks (if provided)",
        default=None,
    )
    verbose: bool = Field(
        description="If True, print verbose output during processing",
        default=False,
    )
    timestamp: bool = Field(
        description="If True, include timestamp in output filenames",
        default=True,
    )
    random_hash_digits: int = Field(
        description="Number of random hash digits to include in output filenames",
        default=4,
        ge=0,
    )
+
170
+
171
class SaveToFileParams(BaseModel):
    """Parameters for saving text content to a file.

    This model defines parameters used by the save_to_file function to save
    text content to a file with various options for naming and handling.
    """

    # NOTE: the docstring and ``description`` strings feed pydantic's JSON
    # schema output, so they are reproduced verbatim.

    # --- payload --------------------------------------------------------
    text: str = Field(description="The text content to save to file")

    # --- destination ----------------------------------------------------
    directory: Path | str = Field(
        description="Directory where the file will be saved",
    )
    filename: str = Field(description="Name of the file to create")
    extension: str | None = Field(
        description="File extension (with or without leading dot)",
        default=None,
    )

    # --- collision handling ---------------------------------------------
    timestamp: bool = Field(
        description="If True, append timestamp to filename",
        default=False,
    )
    dir_exist_ok: bool = Field(
        description="If True, creates directory if it doesn't exist",
        default=True,
    )
    file_exist_ok: bool = Field(
        description="If True, allows overwriting existing files",
        default=False,
    )

    # --- name decoration ------------------------------------------------
    time_prefix: bool = Field(
        description="If True, prepend timestamp instead of append",
        default=False,
    )
    timestamp_format: str | None = Field(
        description="Custom format for timestamp (strftime format)",
        default=None,
    )
    random_hash_digits: int = Field(
        description="Number of random hash digits to append to filename",
        default=0,
        ge=0,
    )

    # --- reporting ------------------------------------------------------
    verbose: bool = Field(
        description="If True, logs the file path after saving",
        default=True,
    )
@@ -0,0 +1,301 @@
1
+ import logging
2
+ import re
3
+ import sys
4
+ from datetime import datetime
5
+ from pathlib import Path
6
+ from typing import Any
7
+
8
+ from ..utils import unique_hash
9
+
10
+
11
+ def create_path(
12
+ directory: Path | str,
13
+ filename: str,
14
+ extension: str = None,
15
+ timestamp: bool = False,
16
+ dir_exist_ok: bool = True,
17
+ file_exist_ok: bool = False,
18
+ time_prefix: bool = False,
19
+ timestamp_format: str | None = None,
20
+ random_hash_digits: int = 0,
21
+ ) -> Path:
22
+ """
23
+ Generate a new file path with optional timestamp and random hash.
24
+
25
+ Args:
26
+ directory: The directory where the file will be created.
27
+ filename: The base name of the file to create.
28
+ timestamp: If True, adds a timestamp to the filename.
29
+ dir_exist_ok: If True, doesn't raise an error if the directory
30
+ exists.
31
+ file_exist_ok: If True, allows overwriting of existing files.
32
+ time_prefix: If True, adds the timestamp as a prefix instead of
33
+ a suffix.
34
+ timestamp_format: Custom format for the timestamp.
35
+ random_hash_digits: Number of digits for the random hash.
36
+
37
+ Returns:
38
+ The full path to the new or existing file.
39
+
40
+ Raises:
41
+ ValueError: If the filename contains illegal characters.
42
+ FileExistsError: If the file exists and file_exist_ok is False.
43
+ """
44
+ if "/" in filename or "\\" in filename:
45
+ raise ValueError("Filename cannot contain directory separators.")
46
+ directory = Path(directory)
47
+
48
+ name, ext = None, None
49
+ if "." in filename:
50
+ name, ext = filename.rsplit(".", 1)
51
+ else:
52
+ name = filename
53
+ ext = extension.strip(".").strip() if extension else None
54
+
55
+ if not ext:
56
+ raise ValueError("No extension provided for filename.")
57
+
58
+ ext = f".{ext}" if ext else ""
59
+
60
+ if timestamp:
61
+ timestamp_str = datetime.now().strftime(
62
+ timestamp_format or "%Y%m%d%H%M%S"
63
+ )
64
+ name = (
65
+ f"{timestamp_str}_{name}"
66
+ if time_prefix
67
+ else f"{name}_{timestamp_str}"
68
+ )
69
+
70
+ if random_hash_digits > 0:
71
+ random_hash = "-" + unique_hash(random_hash_digits)
72
+ name = f"{name}{random_hash}"
73
+
74
+ full_filename = f"{name}{ext}"
75
+ full_path = directory / full_filename
76
+
77
+ if full_path.exists():
78
+ if file_exist_ok:
79
+ return full_path
80
+ raise FileExistsError(
81
+ f"File {full_path} already exists and file_exist_ok is False."
82
+ )
83
+ full_path.parent.mkdir(parents=True, exist_ok=dir_exist_ok)
84
+ return full_path
85
+
86
+
87
+ def is_valid_path(
88
+ path: str | Path,
89
+ *,
90
+ max_length: int | None = None,
91
+ allow_relative: bool = True,
92
+ allow_symlinks: bool = True,
93
+ custom_reserved_names: list[str] | None = None,
94
+ strict_mode: bool = False,
95
+ ) -> bool:
96
+ """
97
+ Validates whether the given path is syntactically valid for the current operating system.
98
+
99
+ Args:
100
+ path (Union[str, Path]): The filesystem path to validate.
101
+ max_length (Optional[int]): Maximum allowed path length. If None, uses OS default.
102
+ allow_relative (bool): Whether to allow relative paths. Default is True.
103
+ allow_symlinks (bool): Whether to allow symlinks. Default is True.
104
+ custom_reserved_names (Optional[List[str]]): Additional reserved names to check.
105
+ strict_mode (bool): If True, applies stricter validation rules. Default is False.
106
+
107
+ Returns:
108
+ bool: True if the path is valid, False otherwise.
109
+
110
+ Raises:
111
+ ValueError: If the path is invalid, with a detailed explanation.
112
+ """
113
+ if isinstance(path, Path):
114
+ path_str = str(path)
115
+ elif isinstance(path, str):
116
+ path_str = path
117
+ else:
118
+ raise TypeError("Path must be a string or Path object.")
119
+
120
+ if not path_str:
121
+ raise ValueError("Path cannot be an empty string.")
122
+
123
+ issues = []
124
+ is_windows = sys.platform.startswith("win")
125
+
126
+ # Common checks for both Windows and Unix-like systems
127
+ if "\0" in path_str:
128
+ issues.append("Path contains null character.")
129
+
130
+ if not max_length:
131
+ max_length = 260 if is_windows else 4096
132
+ if len(path_str) > max_length:
133
+ issues.append(
134
+ f"Path exceeds the maximum length of {max_length} characters."
135
+ )
136
+
137
+ if is_windows:
138
+ # Windows-specific validation
139
+ invalid_chars = r'<>:"/\\|?*'
140
+ if re.search(f"[{re.escape(invalid_chars)}]", path_str):
141
+ issues.append(f"Path contains invalid characters: {invalid_chars}")
142
+
143
+ reserved_names = {
144
+ "CON",
145
+ "PRN",
146
+ "AUX",
147
+ "NUL",
148
+ "COM1",
149
+ "COM2",
150
+ "COM3",
151
+ "COM4",
152
+ "COM5",
153
+ "COM6",
154
+ "COM7",
155
+ "COM8",
156
+ "COM9",
157
+ "LPT1",
158
+ "LPT2",
159
+ "LPT3",
160
+ "LPT4",
161
+ "LPT5",
162
+ "LPT6",
163
+ "LPT7",
164
+ "LPT8",
165
+ "LPT9",
166
+ }
167
+ if custom_reserved_names:
168
+ reserved_names.update(custom_reserved_names)
169
+
170
+ path = Path(path_str)
171
+ for part in path.parts:
172
+ name = part.upper().rstrip(". ")
173
+ if name in reserved_names:
174
+ issues.append(f"Path contains a reserved name: '{part}'")
175
+
176
+ if path_str.endswith(" ") or path_str.endswith("."):
177
+ issues.append(
178
+ "Path cannot end with a space or a period on Windows."
179
+ )
180
+
181
+ if strict_mode:
182
+ if not path_str.startswith("\\\\?\\") and len(path_str) > 260:
183
+ issues.append(
184
+ "Path exceeds 260 characters without long path prefix."
185
+ )
186
+
187
+ else:
188
+ # Unix-like systems validation
189
+ if strict_mode:
190
+ if re.search(r"//+", path_str):
191
+ issues.append("Path contains consecutive slashes.")
192
+
193
+ if not allow_relative and not path_str.startswith("/"):
194
+ issues.append("Relative paths are not allowed.")
195
+
196
+ # Common additional checks
197
+ if not allow_symlinks and Path(path_str).is_symlink():
198
+ issues.append("Symlinks are not allowed.")
199
+
200
+ if strict_mode:
201
+ if re.search(r"\s", path_str):
202
+ issues.append("Path contains whitespace characters.")
203
+
204
+ if issues:
205
+ raise ValueError("Invalid path: " + "; ".join(issues))
206
+
207
+ return True
208
+
209
+
210
+ def split_path(path: Path | str) -> tuple[Path, str]:
211
+ """
212
+ Split a path into its directory and filename components.
213
+
214
+ Args:
215
+ path: The path to split.
216
+
217
+ Returns:
218
+ A tuple containing the directory and filename.
219
+ """
220
+ path = Path(path)
221
+ return path.parent, path.name
222
+
223
+
224
+ def _get_path_kwargs(
225
+ persist_path: str | Path, postfix: str, **path_kwargs: Any
226
+ ) -> dict[str, Any]:
227
+ """
228
+ Generate keyword arguments for path creation.
229
+
230
+ Args:
231
+ persist_path: The base path to use.
232
+ postfix: The file extension to use.
233
+ **path_kwargs: Additional keyword arguments to override defaults.
234
+
235
+ Returns:
236
+ A dictionary of keyword arguments for path creation.
237
+ """
238
+ persist_path = Path(persist_path)
239
+ postfix = f".{postfix.strip('.')}"
240
+
241
+ if persist_path.suffix != postfix:
242
+ dirname = persist_path
243
+ filename = f"new_file{postfix}"
244
+ else:
245
+ dirname, filename = persist_path.parent, persist_path.name
246
+
247
+ return {
248
+ "timestamp": path_kwargs.get("timestamp", False),
249
+ "file_exist_ok": path_kwargs.get("file_exist_ok", True),
250
+ "directory": path_kwargs.get("directory", dirname),
251
+ "filename": path_kwargs.get("filename", filename),
252
+ }
253
+
254
+
255
+ def clear_path(
256
+ path: Path | str,
257
+ /,
258
+ recursive: bool = False,
259
+ exclude: list[str] | None = None,
260
+ ) -> None:
261
+ """
262
+ Clear all files and directories in the specified path.
263
+
264
+ Args:
265
+ path: The path to the directory to clear.
266
+ recursive: If True, clears directories recursively.
267
+ exclude: A list of string patterns to exclude from deletion.
268
+
269
+ Raises:
270
+ FileNotFoundError: If the specified directory does not exist.
271
+ PermissionError: If there are insufficient permissions to delete
272
+ files.
273
+ """
274
+ path = Path(path)
275
+ if not path.exists():
276
+ raise FileNotFoundError(
277
+ f"The specified directory {path} does not exist."
278
+ )
279
+
280
+ exclude = exclude or []
281
+ exclude_pattern = re.compile("|".join(exclude)) if exclude else None
282
+
283
+ for file_path in path.iterdir():
284
+ if exclude_pattern and exclude_pattern.search(file_path.name):
285
+ logging.info(f"Excluded from deletion: {file_path}")
286
+ continue
287
+
288
+ try:
289
+ if file_path.is_dir():
290
+ if recursive:
291
+ clear_path(file_path, recursive=True, exclude=exclude)
292
+ file_path.rmdir()
293
+ else:
294
+ continue
295
+ else:
296
+ file_path.unlink()
297
+ logging.info(f"Successfully deleted {file_path}")
298
+ except PermissionError as e:
299
+ logging.error(f"Permission denied when deleting {file_path}: {e}")
300
+ except Exception as e:
301
+ logging.error(f"Failed to delete {file_path}: {e}")
@@ -0,0 +1,139 @@
1
+ import logging
2
+ from collections.abc import Callable
3
+ from concurrent.futures import ThreadPoolExecutor, as_completed
4
+ from pathlib import Path
5
+ from typing import Any
6
+
7
+ from .chunk import chunk_content
8
+ from .save import save_chunks
9
+
10
+
11
+ def dir_to_files(
12
+ directory: str | Path,
13
+ file_types: list[str] | None = None,
14
+ max_workers: int | None = None,
15
+ ignore_errors: bool = False,
16
+ verbose: bool = False,
17
+ ) -> list[Path]:
18
+ """
19
+ Recursively process a directory and return a list of file paths.
20
+
21
+ This function walks through the given directory and its subdirectories,
22
+ collecting file paths that match the specified file types (if any).
23
+
24
+ Args:
25
+ directory (Union[str, Path]): The directory to process.
26
+ file_types (Optional[List[str]]): List of file extensions to include (e.g., ['.txt', '.pdf']).
27
+ If None, include all file types.
28
+ max_workers (Optional[int]): Maximum number of worker threads for concurrent processing.
29
+ If None, uses the default ThreadPoolExecutor behavior.
30
+ ignore_errors (bool): If True, log warnings for errors instead of raising exceptions.
31
+ verbose (bool): If True, print verbose output.
32
+
33
+ Returns:
34
+ List[Path]: A list of Path objects representing the files found.
35
+
36
+ Raises:
37
+ ValueError: If the provided directory doesn't exist or isn't a directory.
38
+ """
39
+ directory_path = Path(directory)
40
+ if not directory_path.is_dir():
41
+ raise ValueError(
42
+ f"The provided path is not a valid directory: {directory}"
43
+ )
44
+
45
+ def process_file(file_path: Path) -> Path | None:
46
+ try:
47
+ if file_types is None or file_path.suffix in file_types:
48
+ return file_path
49
+ except Exception as e:
50
+ if ignore_errors:
51
+ if verbose:
52
+ logging.warning(f"Error processing {file_path}: {e}")
53
+ else:
54
+ raise ValueError(f"Error processing {file_path}: {e}") from e
55
+ return None
56
+
57
+ try:
58
+ with ThreadPoolExecutor(max_workers=max_workers) as executor:
59
+ futures = [
60
+ executor.submit(process_file, f)
61
+ for f in directory_path.rglob("*")
62
+ if f.is_file()
63
+ ]
64
+ files = [
65
+ future.result()
66
+ for future in as_completed(futures)
67
+ if future.result() is not None
68
+ ]
69
+
70
+ if verbose:
71
+ logging.info(f"Processed {len(files)} files from {directory}")
72
+
73
+ return files
74
+ except Exception as e:
75
+ raise ValueError(f"Error processing directory {directory}: {e}") from e
76
+
77
+
78
def file_to_chunks(
    file_path: str | Path,
    chunk_func: Callable[[str, int, float, int], list[str]],
    chunk_size: int = 1500,
    overlap: float = 0.1,
    threshold: int = 200,
    encoding: str = "utf-8",
    custom_metadata: dict[str, Any] | None = None,
    output_dir: str | Path | None = None,
    verbose: bool = False,
    timestamp: bool = True,
    random_hash_digits: int = 4,
) -> list[dict[str, Any]]:
    """
    Read a text file and split its content into chunks.

    The whole file is read into memory, handed to ``chunk_content`` together
    with file-level metadata, and the resulting chunks are optionally passed
    to ``save_chunks`` when an output directory is given.

    Args:
        file_path: Path to the file to be processed.
        chunk_func: Function to use for chunking the content.
        chunk_size: The target size for each chunk.
        overlap: The fraction of overlap between chunks.
        threshold: The minimum size for the last chunk.
        encoding: File encoding to use when reading the file.
        custom_metadata: Extra metadata merged over the built-in
            ``file_path`` / ``file_name`` / ``file_size`` entries.
        output_dir: Directory to save output chunks (if provided).
        verbose: Forwarded to ``save_chunks``.
        timestamp: Forwarded to ``save_chunks``.
        random_hash_digits: Forwarded to ``save_chunks``.

    Returns:
        Whatever ``chunk_content`` returns for the file content.

    Raises:
        ValueError: If anything fails while reading, chunking or saving;
            the original exception is attached as the cause.
    """
    try:
        file_path = Path(file_path)
        content = file_path.read_text(encoding=encoding)

        # Built-in entries first so that caller-supplied keys win on clash.
        metadata: dict[str, Any] = {
            "file_path": str(file_path),
            "file_name": file_path.name,
            "file_size": file_path.stat().st_size,
        }
        metadata.update(custom_metadata or {})

        # NOTE(review): chunk_content is defined in .chunk and is not
        # visible here; every argument is passed positionally, so confirm
        # that this order matches its signature.
        chunks = chunk_content(
            content, chunk_func, chunk_size, overlap, threshold, metadata
        )

        if output_dir:
            save_chunks(
                chunks, output_dir, verbose, timestamp, random_hash_digits
            )
    except Exception as e:
        raise ValueError(f"Error processing file {file_path}: {e}") from e
    return chunks