lionagi 0.4.0__py3-none-any.whl → 0.5.0__py3-none-any.whl
Sign up to get free protection for your applications and to get access to all the features.
- lionagi/__init__.py +14 -46
- lionagi/core/__init__.py +3 -1
- lionagi/core/_class_registry.py +69 -0
- lionagi/core/action/__init__.py +3 -13
- lionagi/core/action/action_manager.py +287 -0
- lionagi/core/action/base.py +109 -0
- lionagi/core/action/function_calling.py +127 -92
- lionagi/core/action/tool.py +172 -70
- lionagi/core/action/types.py +16 -0
- lionagi/core/communication/__init__.py +3 -0
- lionagi/core/communication/action_request.py +163 -0
- lionagi/core/communication/action_response.py +149 -0
- lionagi/core/communication/assistant_response.py +161 -0
- lionagi/core/communication/base_mail.py +49 -0
- lionagi/core/communication/instruction.py +376 -0
- lionagi/core/communication/message.py +286 -0
- lionagi/core/communication/message_manager.py +530 -0
- lionagi/core/communication/system.py +116 -0
- lionagi/core/communication/templates/README.md +28 -0
- lionagi/core/communication/templates/action_request.jinja2 +5 -0
- lionagi/core/communication/templates/action_response.jinja2 +9 -0
- lionagi/core/communication/templates/assistant_response.jinja2 +2 -0
- lionagi/core/communication/templates/instruction_message.jinja2 +61 -0
- lionagi/core/communication/templates/system_message.jinja2 +11 -0
- lionagi/core/communication/templates/tool_schemas.jinja2 +7 -0
- lionagi/core/communication/types.py +27 -0
- lionagi/core/communication/utils.py +254 -0
- lionagi/core/forms/__init__.py +3 -0
- lionagi/core/forms/base.py +232 -0
- lionagi/core/forms/form.py +791 -0
- lionagi/core/forms/report.py +321 -0
- lionagi/core/forms/types.py +13 -0
- lionagi/core/forms/utils.py +26 -0
- lionagi/core/generic/__init__.py +3 -6
- lionagi/core/generic/component.py +422 -0
- lionagi/core/generic/edge.py +143 -101
- lionagi/core/generic/element.py +195 -0
- lionagi/core/generic/graph.py +297 -180
- lionagi/core/generic/log.py +151 -0
- lionagi/core/generic/log_manager.py +320 -0
- lionagi/core/generic/node.py +7 -229
- lionagi/core/generic/pile.py +1017 -0
- lionagi/core/generic/progression.py +388 -0
- lionagi/core/generic/types.py +23 -0
- lionagi/core/generic/utils.py +50 -0
- lionagi/core/models/__init__.py +5 -0
- lionagi/core/models/base.py +85 -0
- lionagi/core/models/field_model.py +122 -0
- lionagi/core/models/new_model_params.py +195 -0
- lionagi/core/models/note.py +351 -0
- lionagi/core/models/operable_model.py +392 -0
- lionagi/core/models/schema_model.py +50 -0
- lionagi/core/models/types.py +10 -0
- lionagi/core/session/__init__.py +3 -0
- lionagi/core/session/branch.py +115 -415
- lionagi/core/session/branch_mixins.py +507 -0
- lionagi/core/session/session.py +122 -257
- lionagi/core/session/types.py +8 -0
- lionagi/core/typing/__init__.py +9 -0
- lionagi/core/typing/concepts.py +132 -0
- lionagi/core/typing/config.py +15 -0
- lionagi/core/typing/id.py +221 -0
- lionagi/core/typing/pydantic_.py +33 -0
- lionagi/core/typing/typing_.py +54 -0
- lionagi/integrations/__init__.py +0 -1
- lionagi/integrations/anthropic_/AnthropicModel.py +268 -0
- lionagi/integrations/anthropic_/AnthropicService.py +113 -0
- lionagi/integrations/anthropic_/__init__.py +3 -0
- lionagi/integrations/anthropic_/anthropic_max_output_token_data.yaml +7 -0
- lionagi/integrations/anthropic_/anthropic_price_data.yaml +14 -0
- lionagi/integrations/anthropic_/api_endpoints/__init__.py +3 -0
- lionagi/integrations/anthropic_/api_endpoints/api_request.py +277 -0
- lionagi/integrations/anthropic_/api_endpoints/data_models.py +40 -0
- lionagi/integrations/anthropic_/api_endpoints/match_response.py +119 -0
- lionagi/integrations/anthropic_/api_endpoints/messages/__init__.py +3 -0
- lionagi/integrations/anthropic_/api_endpoints/messages/request/__init__.py +3 -0
- lionagi/integrations/anthropic_/api_endpoints/messages/request/message_models.py +14 -0
- lionagi/integrations/anthropic_/api_endpoints/messages/request/request_body.py +74 -0
- lionagi/integrations/anthropic_/api_endpoints/messages/response/content_models.py +32 -0
- lionagi/integrations/anthropic_/api_endpoints/messages/response/response_body.py +101 -0
- lionagi/integrations/anthropic_/api_endpoints/messages/response/usage_models.py +25 -0
- lionagi/integrations/anthropic_/version.py +5 -0
- lionagi/integrations/groq_/GroqModel.py +318 -0
- lionagi/integrations/groq_/GroqService.py +147 -0
- lionagi/integrations/groq_/__init__.py +3 -0
- lionagi/integrations/groq_/api_endpoints/data_models.py +187 -0
- lionagi/integrations/groq_/api_endpoints/groq_request.py +288 -0
- lionagi/integrations/groq_/api_endpoints/match_response.py +106 -0
- lionagi/integrations/groq_/api_endpoints/response_utils.py +105 -0
- lionagi/integrations/groq_/groq_max_output_token_data.yaml +21 -0
- lionagi/integrations/groq_/groq_price_data.yaml +58 -0
- lionagi/integrations/groq_/groq_rate_limits.yaml +105 -0
- lionagi/integrations/groq_/version.py +5 -0
- lionagi/integrations/litellm_/__init__.py +3 -0
- lionagi/integrations/litellm_/imodel.py +69 -0
- lionagi/integrations/ollama_/OllamaModel.py +244 -0
- lionagi/integrations/ollama_/OllamaService.py +138 -0
- lionagi/integrations/ollama_/__init__.py +3 -0
- lionagi/integrations/ollama_/api_endpoints/__init__.py +3 -0
- lionagi/integrations/ollama_/api_endpoints/api_request.py +179 -0
- lionagi/integrations/ollama_/api_endpoints/chat_completion/__init__.py +3 -0
- lionagi/integrations/ollama_/api_endpoints/chat_completion/message_models.py +31 -0
- lionagi/integrations/ollama_/api_endpoints/chat_completion/request_body.py +46 -0
- lionagi/integrations/ollama_/api_endpoints/chat_completion/response_body.py +67 -0
- lionagi/integrations/ollama_/api_endpoints/chat_completion/tool_models.py +49 -0
- lionagi/integrations/ollama_/api_endpoints/completion/request_body.py +72 -0
- lionagi/integrations/ollama_/api_endpoints/completion/response_body.py +59 -0
- lionagi/integrations/ollama_/api_endpoints/data_models.py +15 -0
- lionagi/integrations/ollama_/api_endpoints/embedding/request_body.py +33 -0
- lionagi/integrations/ollama_/api_endpoints/embedding/response_body.py +29 -0
- lionagi/integrations/ollama_/api_endpoints/match_data_model.py +62 -0
- lionagi/integrations/ollama_/api_endpoints/match_response.py +190 -0
- lionagi/integrations/ollama_/api_endpoints/model/__init__.py +3 -0
- lionagi/integrations/ollama_/api_endpoints/model/copy_model.py +13 -0
- lionagi/integrations/ollama_/api_endpoints/model/create_model.py +28 -0
- lionagi/integrations/ollama_/api_endpoints/model/delete_model.py +11 -0
- lionagi/integrations/ollama_/api_endpoints/model/list_model.py +60 -0
- lionagi/integrations/ollama_/api_endpoints/model/pull_model.py +34 -0
- lionagi/integrations/ollama_/api_endpoints/model/push_model.py +35 -0
- lionagi/integrations/ollama_/api_endpoints/model/show_model.py +36 -0
- lionagi/integrations/ollama_/api_endpoints/option_models.py +68 -0
- lionagi/integrations/openai_/OpenAIModel.py +414 -0
- lionagi/integrations/openai_/OpenAIService.py +426 -0
- lionagi/integrations/openai_/api_endpoints/__init__.py +3 -0
- lionagi/integrations/openai_/api_endpoints/api_request.py +277 -0
- lionagi/integrations/openai_/api_endpoints/audio/__init__.py +9 -0
- lionagi/integrations/openai_/api_endpoints/audio/speech_models.py +34 -0
- lionagi/integrations/openai_/api_endpoints/audio/transcription_models.py +136 -0
- lionagi/integrations/openai_/api_endpoints/audio/translation_models.py +41 -0
- lionagi/integrations/openai_/api_endpoints/audio/types.py +41 -0
- lionagi/integrations/openai_/api_endpoints/batch/__init__.py +17 -0
- lionagi/integrations/openai_/api_endpoints/batch/batch_models.py +146 -0
- lionagi/integrations/openai_/api_endpoints/batch/cancel_batch.py +7 -0
- lionagi/integrations/openai_/api_endpoints/batch/create_batch.py +26 -0
- lionagi/integrations/openai_/api_endpoints/batch/list_batch.py +37 -0
- lionagi/integrations/openai_/api_endpoints/batch/request_object_models.py +65 -0
- lionagi/integrations/openai_/api_endpoints/batch/retrieve_batch.py +7 -0
- lionagi/integrations/openai_/api_endpoints/batch/types.py +4 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/__init__.py +1 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/__init__.py +39 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/message_models.py +121 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/request_body.py +221 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/response_format.py +71 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/stream_options.py +14 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/tool_choice_models.py +17 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/tool_models.py +54 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/request/types.py +18 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/choice_models.py +62 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/function_models.py +16 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/log_prob_models.py +47 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/message_models.py +25 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/response_body.py +99 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/types.py +8 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/response/usage_models.py +24 -0
- lionagi/integrations/openai_/api_endpoints/chat_completions/util.py +46 -0
- lionagi/integrations/openai_/api_endpoints/data_models.py +23 -0
- lionagi/integrations/openai_/api_endpoints/embeddings/__init__.py +3 -0
- lionagi/integrations/openai_/api_endpoints/embeddings/request_body.py +79 -0
- lionagi/integrations/openai_/api_endpoints/embeddings/response_body.py +67 -0
- lionagi/integrations/openai_/api_endpoints/files/__init__.py +11 -0
- lionagi/integrations/openai_/api_endpoints/files/delete_file.py +20 -0
- lionagi/integrations/openai_/api_endpoints/files/file_models.py +56 -0
- lionagi/integrations/openai_/api_endpoints/files/list_files.py +27 -0
- lionagi/integrations/openai_/api_endpoints/files/retrieve_file.py +9 -0
- lionagi/integrations/openai_/api_endpoints/files/upload_file.py +38 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/__init__.py +37 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/cancel_jobs.py +9 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/create_jobs.py +133 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/fine_tuning_job_checkpoint_models.py +58 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/fine_tuning_job_event_models.py +31 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/fine_tuning_job_models.py +140 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/list_fine_tuning_checkpoints.py +51 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/list_fine_tuning_events.py +42 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/list_fine_tuning_jobs.py +31 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/retrieve_jobs.py +9 -0
- lionagi/integrations/openai_/api_endpoints/fine_tuning/training_format.py +30 -0
- lionagi/integrations/openai_/api_endpoints/images/__init__.py +9 -0
- lionagi/integrations/openai_/api_endpoints/images/image_edit_models.py +69 -0
- lionagi/integrations/openai_/api_endpoints/images/image_models.py +56 -0
- lionagi/integrations/openai_/api_endpoints/images/image_variation_models.py +56 -0
- lionagi/integrations/openai_/api_endpoints/images/response_body.py +30 -0
- lionagi/integrations/openai_/api_endpoints/match_data_model.py +197 -0
- lionagi/integrations/openai_/api_endpoints/match_response.py +336 -0
- lionagi/integrations/openai_/api_endpoints/models/__init__.py +7 -0
- lionagi/integrations/openai_/api_endpoints/models/delete_fine_tuned_model.py +17 -0
- lionagi/integrations/openai_/api_endpoints/models/models_models.py +31 -0
- lionagi/integrations/openai_/api_endpoints/models/retrieve_model.py +9 -0
- lionagi/integrations/openai_/api_endpoints/moderations/__init__.py +3 -0
- lionagi/integrations/openai_/api_endpoints/moderations/request_body.py +20 -0
- lionagi/integrations/openai_/api_endpoints/moderations/response_body.py +139 -0
- lionagi/integrations/openai_/api_endpoints/uploads/__init__.py +19 -0
- lionagi/integrations/openai_/api_endpoints/uploads/add_upload_part.py +11 -0
- lionagi/integrations/openai_/api_endpoints/uploads/cancel_upload.py +7 -0
- lionagi/integrations/openai_/api_endpoints/uploads/complete_upload.py +18 -0
- lionagi/integrations/openai_/api_endpoints/uploads/create_upload.py +17 -0
- lionagi/integrations/openai_/api_endpoints/uploads/uploads_models.py +52 -0
- lionagi/integrations/openai_/image_token_calculator/image_token_calculator.py +92 -0
- lionagi/integrations/openai_/image_token_calculator/openai_image_token_data.yaml +15 -0
- lionagi/integrations/openai_/openai_max_output_token_data.yaml +12 -0
- lionagi/integrations/openai_/openai_price_data.yaml +26 -0
- lionagi/integrations/openai_/version.py +1 -0
- lionagi/integrations/pandas_/__init__.py +24 -0
- lionagi/integrations/pandas_/extend_df.py +61 -0
- lionagi/integrations/pandas_/read.py +103 -0
- lionagi/integrations/pandas_/remove_rows.py +61 -0
- lionagi/integrations/pandas_/replace_keywords.py +65 -0
- lionagi/integrations/pandas_/save.py +131 -0
- lionagi/integrations/pandas_/search_keywords.py +69 -0
- lionagi/integrations/pandas_/to_df.py +196 -0
- lionagi/integrations/pandas_/update_cells.py +54 -0
- lionagi/integrations/perplexity_/PerplexityModel.py +269 -0
- lionagi/integrations/perplexity_/PerplexityService.py +109 -0
- lionagi/integrations/perplexity_/__init__.py +3 -0
- lionagi/integrations/perplexity_/api_endpoints/api_request.py +171 -0
- lionagi/integrations/perplexity_/api_endpoints/chat_completions/request/request_body.py +121 -0
- lionagi/integrations/perplexity_/api_endpoints/chat_completions/response/response_body.py +146 -0
- lionagi/integrations/perplexity_/api_endpoints/data_models.py +63 -0
- lionagi/integrations/perplexity_/api_endpoints/match_response.py +26 -0
- lionagi/integrations/perplexity_/perplexity_max_output_token_data.yaml +3 -0
- lionagi/integrations/perplexity_/perplexity_price_data.yaml +10 -0
- lionagi/integrations/perplexity_/version.py +1 -0
- lionagi/integrations/pydantic_/__init__.py +8 -0
- lionagi/integrations/pydantic_/break_down_annotation.py +81 -0
- lionagi/integrations/pydantic_/new_model.py +208 -0
- lionagi/integrations/services.py +17 -0
- lionagi/libs/__init__.py +0 -55
- lionagi/libs/compress/models.py +62 -0
- lionagi/libs/compress/utils.py +81 -0
- lionagi/libs/constants.py +98 -0
- lionagi/libs/file/chunk.py +265 -0
- lionagi/libs/file/file_ops.py +114 -0
- lionagi/libs/file/params.py +212 -0
- lionagi/libs/file/path.py +301 -0
- lionagi/libs/file/process.py +139 -0
- lionagi/libs/file/save.py +90 -0
- lionagi/libs/file/types.py +22 -0
- lionagi/libs/func/async_calls/__init__.py +21 -0
- lionagi/libs/func/async_calls/alcall.py +157 -0
- lionagi/libs/func/async_calls/bcall.py +82 -0
- lionagi/libs/func/async_calls/mcall.py +134 -0
- lionagi/libs/func/async_calls/pcall.py +149 -0
- lionagi/libs/func/async_calls/rcall.py +185 -0
- lionagi/libs/func/async_calls/tcall.py +114 -0
- lionagi/libs/func/async_calls/ucall.py +85 -0
- lionagi/libs/func/decorators.py +277 -0
- lionagi/libs/func/lcall.py +57 -0
- lionagi/libs/func/params.py +64 -0
- lionagi/libs/func/throttle.py +119 -0
- lionagi/libs/func/types.py +39 -0
- lionagi/libs/func/utils.py +96 -0
- lionagi/libs/package/imports.py +162 -0
- lionagi/libs/package/management.py +58 -0
- lionagi/libs/package/params.py +26 -0
- lionagi/libs/package/system.py +18 -0
- lionagi/libs/package/types.py +26 -0
- lionagi/libs/parse/__init__.py +1 -0
- lionagi/libs/parse/flatten/__init__.py +9 -0
- lionagi/libs/parse/flatten/flatten.py +168 -0
- lionagi/libs/parse/flatten/params.py +52 -0
- lionagi/libs/parse/flatten/unflatten.py +79 -0
- lionagi/libs/parse/json/__init__.py +27 -0
- lionagi/libs/parse/json/as_readable.py +104 -0
- lionagi/libs/parse/json/extract.py +102 -0
- lionagi/libs/parse/json/parse.py +179 -0
- lionagi/libs/parse/json/schema.py +227 -0
- lionagi/libs/parse/json/to_json.py +71 -0
- lionagi/libs/parse/nested/__init__.py +33 -0
- lionagi/libs/parse/nested/nfilter.py +55 -0
- lionagi/libs/parse/nested/nget.py +40 -0
- lionagi/libs/parse/nested/ninsert.py +103 -0
- lionagi/libs/parse/nested/nmerge.py +155 -0
- lionagi/libs/parse/nested/npop.py +66 -0
- lionagi/libs/parse/nested/nset.py +89 -0
- lionagi/libs/parse/nested/to_flat_list.py +64 -0
- lionagi/libs/parse/nested/utils.py +185 -0
- lionagi/libs/parse/string_parse/__init__.py +11 -0
- lionagi/libs/parse/string_parse/code_block.py +73 -0
- lionagi/libs/parse/string_parse/docstring.py +179 -0
- lionagi/libs/parse/string_parse/function_.py +92 -0
- lionagi/libs/parse/type_convert/__init__.py +19 -0
- lionagi/libs/parse/type_convert/params.py +145 -0
- lionagi/libs/parse/type_convert/to_dict.py +333 -0
- lionagi/libs/parse/type_convert/to_list.py +186 -0
- lionagi/libs/parse/type_convert/to_num.py +358 -0
- lionagi/libs/parse/type_convert/to_str.py +195 -0
- lionagi/libs/parse/types.py +9 -0
- lionagi/libs/parse/validate/__init__.py +14 -0
- lionagi/libs/parse/validate/boolean.py +96 -0
- lionagi/libs/parse/validate/keys.py +150 -0
- lionagi/libs/parse/validate/mapping.py +109 -0
- lionagi/libs/parse/validate/params.py +62 -0
- lionagi/libs/parse/xml/__init__.py +10 -0
- lionagi/libs/parse/xml/convert.py +56 -0
- lionagi/libs/parse/xml/parser.py +93 -0
- lionagi/libs/string_similarity/__init__.py +32 -0
- lionagi/libs/string_similarity/algorithms.py +219 -0
- lionagi/libs/string_similarity/matcher.py +102 -0
- lionagi/libs/string_similarity/utils.py +15 -0
- lionagi/libs/utils.py +255 -0
- lionagi/operations/__init__.py +3 -6
- lionagi/operations/brainstorm/__init__.py +3 -0
- lionagi/operations/brainstorm/brainstorm.py +204 -0
- lionagi/operations/brainstorm/prompt.py +1 -0
- lionagi/operations/plan/__init__.py +3 -0
- lionagi/operations/plan/plan.py +172 -0
- lionagi/operations/plan/prompt.py +21 -0
- lionagi/operations/select/__init__.py +3 -0
- lionagi/operations/select/prompt.py +1 -0
- lionagi/operations/select/select.py +100 -0
- lionagi/operations/select/utils.py +107 -0
- lionagi/operations/utils.py +35 -0
- lionagi/protocols/adapters/adapter.py +79 -0
- lionagi/protocols/adapters/json_adapter.py +43 -0
- lionagi/protocols/adapters/pandas_adapter.py +96 -0
- lionagi/protocols/configs/__init__.py +15 -0
- lionagi/protocols/configs/branch_config.py +86 -0
- lionagi/protocols/configs/id_config.py +15 -0
- lionagi/protocols/configs/imodel_config.py +73 -0
- lionagi/protocols/configs/log_config.py +93 -0
- lionagi/protocols/configs/retry_config.py +29 -0
- lionagi/protocols/operatives/__init__.py +15 -0
- lionagi/protocols/operatives/action.py +181 -0
- lionagi/protocols/operatives/instruct.py +196 -0
- lionagi/protocols/operatives/operative.py +182 -0
- lionagi/protocols/operatives/prompts.py +232 -0
- lionagi/protocols/operatives/reason.py +56 -0
- lionagi/protocols/operatives/step.py +217 -0
- lionagi/protocols/registries/_component_registry.py +19 -0
- lionagi/protocols/registries/_pile_registry.py +26 -0
- lionagi/service/__init__.py +13 -0
- lionagi/service/complete_request_info.py +11 -0
- lionagi/service/imodel.py +110 -0
- lionagi/service/rate_limiter.py +108 -0
- lionagi/service/service.py +37 -0
- lionagi/service/service_match_util.py +131 -0
- lionagi/service/service_util.py +72 -0
- lionagi/service/token_calculator.py +51 -0
- lionagi/settings.py +136 -0
- lionagi/strategies/base.py +53 -0
- lionagi/strategies/concurrent.py +71 -0
- lionagi/strategies/concurrent_chunk.py +43 -0
- lionagi/strategies/concurrent_sequential_chunk.py +104 -0
- lionagi/strategies/params.py +128 -0
- lionagi/strategies/sequential.py +23 -0
- lionagi/strategies/sequential_chunk.py +89 -0
- lionagi/strategies/sequential_concurrent_chunk.py +100 -0
- lionagi/strategies/types.py +21 -0
- lionagi/strategies/utils.py +49 -0
- lionagi/version.py +1 -1
- lionagi-0.5.0.dist-info/METADATA +348 -0
- lionagi-0.5.0.dist-info/RECORD +373 -0
- {lionagi-0.4.0.dist-info → lionagi-0.5.0.dist-info}/WHEEL +1 -1
- lionagi/core/_setting/_setting.py +0 -59
- lionagi/core/action/README.md +0 -20
- lionagi/core/action/manual.py +0 -1
- lionagi/core/action/node.py +0 -94
- lionagi/core/action/tool_manager.py +0 -342
- lionagi/core/agent/README.md +0 -1
- lionagi/core/agent/base_agent.py +0 -82
- lionagi/core/agent/eval/README.md +0 -1
- lionagi/core/agent/eval/evaluator.py +0 -1
- lionagi/core/agent/eval/vote.py +0 -40
- lionagi/core/agent/learn/learner.py +0 -59
- lionagi/core/agent/plan/unit_template.py +0 -1
- lionagi/core/collections/README.md +0 -23
- lionagi/core/collections/__init__.py +0 -16
- lionagi/core/collections/_logger.py +0 -312
- lionagi/core/collections/abc/README.md +0 -63
- lionagi/core/collections/abc/__init__.py +0 -53
- lionagi/core/collections/abc/component.py +0 -620
- lionagi/core/collections/abc/concepts.py +0 -277
- lionagi/core/collections/abc/exceptions.py +0 -136
- lionagi/core/collections/abc/util.py +0 -45
- lionagi/core/collections/exchange.py +0 -146
- lionagi/core/collections/flow.py +0 -416
- lionagi/core/collections/model.py +0 -465
- lionagi/core/collections/pile.py +0 -1232
- lionagi/core/collections/progression.py +0 -221
- lionagi/core/collections/util.py +0 -73
- lionagi/core/director/README.md +0 -1
- lionagi/core/director/direct.py +0 -298
- lionagi/core/director/director.py +0 -2
- lionagi/core/director/operations/select.py +0 -3
- lionagi/core/director/operations/utils.py +0 -6
- lionagi/core/engine/branch_engine.py +0 -361
- lionagi/core/engine/instruction_map_engine.py +0 -213
- lionagi/core/engine/sandbox_.py +0 -16
- lionagi/core/engine/script_engine.py +0 -89
- lionagi/core/executor/base_executor.py +0 -97
- lionagi/core/executor/graph_executor.py +0 -335
- lionagi/core/executor/neo4j_executor.py +0 -394
- lionagi/core/generic/README.md +0 -0
- lionagi/core/generic/edge_condition.py +0 -17
- lionagi/core/generic/hyperedge.py +0 -1
- lionagi/core/generic/tree.py +0 -49
- lionagi/core/generic/tree_node.py +0 -85
- lionagi/core/mail/__init__.py +0 -11
- lionagi/core/mail/mail.py +0 -26
- lionagi/core/mail/mail_manager.py +0 -185
- lionagi/core/mail/package.py +0 -49
- lionagi/core/mail/start_mail.py +0 -36
- lionagi/core/message/__init__.py +0 -18
- lionagi/core/message/action_request.py +0 -114
- lionagi/core/message/action_response.py +0 -121
- lionagi/core/message/assistant_response.py +0 -80
- lionagi/core/message/instruction.py +0 -194
- lionagi/core/message/message.py +0 -86
- lionagi/core/message/system.py +0 -71
- lionagi/core/message/util.py +0 -274
- lionagi/core/report/__init__.py +0 -4
- lionagi/core/report/base.py +0 -201
- lionagi/core/report/form.py +0 -212
- lionagi/core/report/report.py +0 -150
- lionagi/core/report/util.py +0 -15
- lionagi/core/rule/_default.py +0 -17
- lionagi/core/rule/action.py +0 -87
- lionagi/core/rule/base.py +0 -234
- lionagi/core/rule/boolean.py +0 -56
- lionagi/core/rule/choice.py +0 -48
- lionagi/core/rule/mapping.py +0 -82
- lionagi/core/rule/number.py +0 -73
- lionagi/core/rule/rulebook.py +0 -45
- lionagi/core/rule/string.py +0 -43
- lionagi/core/rule/util.py +0 -0
- lionagi/core/session/directive_mixin.py +0 -307
- lionagi/core/structure/__init__.py +0 -1
- lionagi/core/structure/chain.py +0 -1
- lionagi/core/structure/forest.py +0 -1
- lionagi/core/structure/graph.py +0 -1
- lionagi/core/structure/tree.py +0 -1
- lionagi/core/unit/__init__.py +0 -4
- lionagi/core/unit/parallel_unit.py +0 -234
- lionagi/core/unit/template/action.py +0 -65
- lionagi/core/unit/template/base.py +0 -35
- lionagi/core/unit/template/plan.py +0 -69
- lionagi/core/unit/template/predict.py +0 -95
- lionagi/core/unit/template/score.py +0 -108
- lionagi/core/unit/template/select.py +0 -91
- lionagi/core/unit/unit.py +0 -452
- lionagi/core/unit/unit_form.py +0 -290
- lionagi/core/unit/unit_mixin.py +0 -1166
- lionagi/core/unit/util.py +0 -103
- lionagi/core/validator/validator.py +0 -376
- lionagi/core/work/work.py +0 -59
- lionagi/core/work/work_edge.py +0 -102
- lionagi/core/work/work_function.py +0 -114
- lionagi/core/work/work_function_node.py +0 -50
- lionagi/core/work/work_queue.py +0 -90
- lionagi/core/work/work_task.py +0 -151
- lionagi/core/work/worker.py +0 -410
- lionagi/core/work/worker_engine.py +0 -208
- lionagi/core/work/worklog.py +0 -108
- lionagi/experimental/compressor/base.py +0 -47
- lionagi/experimental/compressor/llm_compressor.py +0 -265
- lionagi/experimental/compressor/llm_summarizer.py +0 -61
- lionagi/experimental/compressor/util.py +0 -70
- lionagi/experimental/directive/README.md +0 -1
- lionagi/experimental/directive/__init__.py +0 -19
- lionagi/experimental/directive/parser/base_parser.py +0 -294
- lionagi/experimental/directive/parser/base_syntax.txt +0 -200
- lionagi/experimental/directive/template/base_template.py +0 -71
- lionagi/experimental/directive/template/schema.py +0 -36
- lionagi/experimental/directive/tokenizer.py +0 -59
- lionagi/experimental/evaluator/README.md +0 -1
- lionagi/experimental/evaluator/ast_evaluator.py +0 -119
- lionagi/experimental/evaluator/base_evaluator.py +0 -213
- lionagi/experimental/knowledge/__init__.py +0 -0
- lionagi/experimental/knowledge/base.py +0 -10
- lionagi/experimental/knowledge/graph.py +0 -0
- lionagi/experimental/memory/__init__.py +0 -0
- lionagi/experimental/strategies/__init__.py +0 -0
- lionagi/experimental/strategies/base.py +0 -1
- lionagi/integrations/bridge/__init__.py +0 -4
- lionagi/integrations/bridge/autogen_/__init__.py +0 -0
- lionagi/integrations/bridge/autogen_/autogen_.py +0 -127
- lionagi/integrations/bridge/langchain_/__init__.py +0 -0
- lionagi/integrations/bridge/langchain_/documents.py +0 -138
- lionagi/integrations/bridge/langchain_/langchain_bridge.py +0 -68
- lionagi/integrations/bridge/llamaindex_/__init__.py +0 -0
- lionagi/integrations/bridge/llamaindex_/index.py +0 -36
- lionagi/integrations/bridge/llamaindex_/llama_index_bridge.py +0 -108
- lionagi/integrations/bridge/llamaindex_/llama_pack.py +0 -256
- lionagi/integrations/bridge/llamaindex_/node_parser.py +0 -92
- lionagi/integrations/bridge/llamaindex_/reader.py +0 -201
- lionagi/integrations/bridge/llamaindex_/textnode.py +0 -59
- lionagi/integrations/bridge/pydantic_/__init__.py +0 -0
- lionagi/integrations/bridge/pydantic_/pydantic_bridge.py +0 -7
- lionagi/integrations/bridge/transformers_/__init__.py +0 -0
- lionagi/integrations/bridge/transformers_/install_.py +0 -39
- lionagi/integrations/chunker/__init__.py +0 -0
- lionagi/integrations/chunker/chunk.py +0 -314
- lionagi/integrations/config/__init__.py +0 -4
- lionagi/integrations/config/mlx_configs.py +0 -1
- lionagi/integrations/config/oai_configs.py +0 -154
- lionagi/integrations/config/ollama_configs.py +0 -1
- lionagi/integrations/config/openrouter_configs.py +0 -74
- lionagi/integrations/langchain_/__init__.py +0 -0
- lionagi/integrations/llamaindex_/__init__.py +0 -0
- lionagi/integrations/loader/__init__.py +0 -0
- lionagi/integrations/loader/load.py +0 -257
- lionagi/integrations/loader/load_util.py +0 -214
- lionagi/integrations/provider/__init__.py +0 -11
- lionagi/integrations/provider/_mapping.py +0 -47
- lionagi/integrations/provider/litellm.py +0 -53
- lionagi/integrations/provider/mistralai.py +0 -1
- lionagi/integrations/provider/mlx_service.py +0 -55
- lionagi/integrations/provider/oai.py +0 -196
- lionagi/integrations/provider/ollama.py +0 -55
- lionagi/integrations/provider/openrouter.py +0 -170
- lionagi/integrations/provider/services.py +0 -138
- lionagi/integrations/provider/transformers.py +0 -108
- lionagi/integrations/storage/__init__.py +0 -3
- lionagi/integrations/storage/neo4j.py +0 -681
- lionagi/integrations/storage/storage_util.py +0 -302
- lionagi/integrations/storage/structure_excel.py +0 -291
- lionagi/integrations/storage/to_csv.py +0 -70
- lionagi/integrations/storage/to_excel.py +0 -91
- lionagi/libs/ln_api.py +0 -944
- lionagi/libs/ln_async.py +0 -208
- lionagi/libs/ln_context.py +0 -37
- lionagi/libs/ln_convert.py +0 -671
- lionagi/libs/ln_dataframe.py +0 -187
- lionagi/libs/ln_func_call.py +0 -1328
- lionagi/libs/ln_image.py +0 -114
- lionagi/libs/ln_knowledge_graph.py +0 -422
- lionagi/libs/ln_nested.py +0 -822
- lionagi/libs/ln_parse.py +0 -750
- lionagi/libs/ln_queue.py +0 -107
- lionagi/libs/ln_tokenize.py +0 -179
- lionagi/libs/ln_validate.py +0 -299
- lionagi/libs/special_tokens.py +0 -172
- lionagi/libs/sys_util.py +0 -710
- lionagi/lions/__init__.py +0 -0
- lionagi/lions/coder/__init__.py +0 -0
- lionagi/lions/coder/add_feature.py +0 -20
- lionagi/lions/coder/base_prompts.py +0 -22
- lionagi/lions/coder/code_form.py +0 -15
- lionagi/lions/coder/coder.py +0 -184
- lionagi/lions/coder/util.py +0 -101
- lionagi/lions/director/__init__.py +0 -0
- lionagi/lions/judge/__init__.py +0 -0
- lionagi/lions/judge/config.py +0 -8
- lionagi/lions/judge/data/__init__.py +0 -0
- lionagi/lions/judge/data/sample_codes.py +0 -526
- lionagi/lions/judge/data/sample_rurbic.py +0 -48
- lionagi/lions/judge/forms/__init__.py +0 -0
- lionagi/lions/judge/forms/code_analysis_form.py +0 -126
- lionagi/lions/judge/rubric.py +0 -34
- lionagi/lions/judge/services/__init__.py +0 -0
- lionagi/lions/judge/services/judge_code.py +0 -49
- lionagi/lions/researcher/__init__.py +0 -0
- lionagi/lions/researcher/data_source/__init__.py +0 -0
- lionagi/lions/researcher/data_source/finhub_.py +0 -192
- lionagi/lions/researcher/data_source/google_.py +0 -207
- lionagi/lions/researcher/data_source/wiki_.py +0 -98
- lionagi/lions/researcher/data_source/yfinance_.py +0 -21
- lionagi/operations/brainstorm.py +0 -87
- lionagi/operations/config.py +0 -6
- lionagi/operations/rank.py +0 -102
- lionagi/operations/score.py +0 -144
- lionagi/operations/select.py +0 -141
- lionagi-0.4.0.dist-info/METADATA +0 -241
- lionagi-0.4.0.dist-info/RECORD +0 -249
- /lionagi/{core/_setting → integrations/anthropic_/api_endpoints/messages/response}/__init__.py +0 -0
- /lionagi/{core/agent → integrations/groq_/api_endpoints}/__init__.py +0 -0
- /lionagi/{core/agent/eval → integrations/ollama_/api_endpoints/completion}/__init__.py +0 -0
- /lionagi/{core/agent/learn → integrations/ollama_/api_endpoints/embedding}/__init__.py +0 -0
- /lionagi/{core/agent/plan → integrations/openai_}/__init__.py +0 -0
- /lionagi/{core/director → integrations/openai_/api_endpoints/chat_completions/response}/__init__.py +0 -0
- /lionagi/{core/director/operations → integrations/openai_/image_token_calculator}/__init__.py +0 -0
- /lionagi/{core/engine → integrations/perplexity_/api_endpoints}/__init__.py +0 -0
- /lionagi/{core/executor → integrations/perplexity_/api_endpoints/chat_completions}/__init__.py +0 -0
- /lionagi/{core/generic/registry/component_registry → integrations/perplexity_/api_endpoints/chat_completions/request}/__init__.py +0 -0
- /lionagi/{core/rule → integrations/perplexity_/api_endpoints/chat_completions/response}/__init__.py +0 -0
- /lionagi/{core/unit/template → libs/compress}/__init__.py +0 -0
- /lionagi/{core/validator → libs/file}/__init__.py +0 -0
- /lionagi/{core/work → libs/func}/__init__.py +0 -0
- /lionagi/{experimental → libs/package}/__init__.py +0 -0
- /lionagi/{core/agent/plan/plan.py → libs/parse/params.py} +0 -0
- /lionagi/{experimental/compressor → protocols}/__init__.py +0 -0
- /lionagi/{experimental/directive/parser → protocols/adapters}/__init__.py +0 -0
- /lionagi/{experimental/directive/template → protocols/registries}/__init__.py +0 -0
- /lionagi/{experimental/evaluator → strategies}/__init__.py +0 -0
- {lionagi-0.4.0.dist-info → lionagi-0.5.0.dist-info/licenses}/LICENSE +0 -0
@@ -0,0 +1,212 @@
|
|
1
|
+
from collections.abc import Callable
|
2
|
+
from pathlib import Path
|
3
|
+
from typing import Any, Literal
|
4
|
+
|
5
|
+
from pydantic import BaseModel, Field
|
6
|
+
|
7
|
+
|
8
|
+
class ChunkContentParams(BaseModel):
    """Parameters for chunking text content into smaller pieces.

    This model defines parameters used by the chunk_content function to split text
    content into chunks, with support for both character-based and token-based chunking.
    """

    # --- what to split and how -------------------------------------------
    content: str = Field(
        description="The text content to be chunked",
    )
    chunk_by: Literal["chars", "tokens"] = Field(
        default="chars",
        description="Method to use for chunking: 'chars' for character-based or 'tokens' for token-based",
    )
    # None is allowed here; per the description the consumer is expected to
    # fall back to str.split in that case.
    tokenizer: Callable[[str], list[str]] | None = Field(
        default=None,
        description="Function to use for tokenization. Defaults to str.split if None",
    )

    # --- sizing (validated: chunk_size >= 1, 0 <= overlap <= 1, threshold >= 0)
    chunk_size: int = Field(
        default=1024,
        ge=1,
        description="Target size for each chunk",
    )
    overlap: float = Field(
        default=0.0,
        ge=0.0,
        le=1.0,
        description="Fraction of overlap between chunks (0.0 to 1.0)",
    )
    threshold: int = Field(
        default=256,
        ge=0,
        description="Minimum size threshold for the last chunk",
    )

    # --- output shaping ---------------------------------------------------
    # default_factory gives every instance its own dict.
    metadata: dict[str, Any] = Field(
        default_factory=dict,
        description="Additional metadata to include with each chunk",
    )
    return_tokens: bool = Field(
        default=False,
        description="If True, return chunks as token lists; if False, return as joined strings",
    )
|
46
|
+
|
47
|
+
|
48
|
+
class CreatePathParams(BaseModel):
    """Parameters for creating file paths with various options.

    This model defines parameters used by the create_path function to generate
    file paths with support for timestamps, random hashes, and existence checks.
    """

    # --- location and base name (required) --------------------------------
    directory: Path | str = Field(
        description="Directory where the file will be created",
    )
    filename: str = Field(
        description="Base name of the file to create",
    )
    extension: str | None = Field(
        default=None,
        description="File extension (with or without leading dot)",
    )

    # --- existence handling -----------------------------------------------
    timestamp: bool = Field(
        default=False,
        description="If True, adds a timestamp to the filename",
    )
    dir_exist_ok: bool = Field(
        default=True,
        description="If True, doesn't raise an error if the directory exists",
    )
    file_exist_ok: bool = Field(
        default=False,
        description="If True, allows overwriting of existing files",
    )

    # --- name decoration --------------------------------------------------
    time_prefix: bool = Field(
        default=False,
        description="If True, adds timestamp as prefix instead of suffix",
    )
    timestamp_format: str | None = Field(
        default=None,
        description="Custom format for the timestamp (strftime format)",
    )
    # Validated to be non-negative; 0 is the default.
    random_hash_digits: int = Field(
        default=0,
        ge=0,
        description="Number of random hash digits to append to filename",
    )
|
87
|
+
|
88
|
+
|
89
|
+
class DirToFilesParams(BaseModel):
    """Parameters for processing directories and collecting file paths.

    This model defines parameters used by the dir_to_files function to recursively
    process directories and collect matching file paths.
    """

    # Root of the traversal (required).
    directory: Path | str = Field(
        description="Directory to process recursively",
    )
    # None means "no filtering by extension".
    file_types: list[str] | None = Field(
        default=None,
        description="List of file extensions to include (e.g., ['.txt', '.pdf']). If None, includes all types",
    )
    max_workers: int | None = Field(
        default=None,
        description="Maximum number of worker threads for concurrent processing",
    )

    # --- diagnostics ------------------------------------------------------
    ignore_errors: bool = Field(
        default=False,
        description="If True, log warnings for errors instead of raising exceptions",
    )
    verbose: bool = Field(
        default=False,
        description="If True, print verbose output during processing",
    )
|
115
|
+
|
116
|
+
|
117
|
+
class FileToChunksParams(BaseModel):
    """Parameters for splitting file content into chunks.

    This model defines parameters used by the file_to_chunks function to read
    and split file content into chunks with metadata.
    """

    # --- input (both required) --------------------------------------------
    file_path: Path | str = Field(
        description="Path to the file to be processed",
    )
    chunk_func: Callable[[str, int, float, int], list[str]] = Field(
        description="Function to use for chunking the content",
    )

    # --- sizing (validated: chunk_size >= 1, 0 <= overlap <= 1, threshold >= 0)
    chunk_size: int = Field(
        default=1500,
        ge=1,
        description="Target size for each chunk",
    )
    overlap: float = Field(
        default=0.1,
        ge=0.0,
        le=1.0,
        description="Fraction of overlap between chunks (0.0 to 1.0)",
    )
    threshold: int = Field(
        default=200,
        ge=0,
        description="Minimum size threshold for the last chunk",
    )

    # --- reading and metadata ---------------------------------------------
    encoding: str = Field(
        default="utf-8",
        description="File encoding to use when reading the file",
    )
    custom_metadata: dict[str, Any] | None = Field(
        default=None,
        description="Additional metadata to include with each chunk",
    )

    # --- optional persistence of the chunks -------------------------------
    output_dir: Path | str | None = Field(
        default=None,
        description="Directory to save output chunks (if provided)",
    )
    verbose: bool = Field(
        default=False,
        description="If True, print verbose output during processing",
    )
    timestamp: bool = Field(
        default=True,
        description="If True, include timestamp in output filenames",
    )
    random_hash_digits: int = Field(
        default=4,
        ge=0,
        description="Number of random hash digits to include in output filenames",
    )
|
169
|
+
|
170
|
+
|
171
|
+
class SaveToFileParams(BaseModel):
    """Parameters for saving text content to a file.

    This model defines parameters used by the save_to_file function to save
    text content to a file with various options for naming and handling.
    """

    # --- payload and destination (required) -------------------------------
    text: str = Field(
        description="The text content to save to file",
    )
    directory: Path | str = Field(
        description="Directory where the file will be saved",
    )
    filename: str = Field(
        description="Name of the file to create",
    )
    extension: str | None = Field(
        default=None,
        description="File extension (with or without leading dot)",
    )

    # --- existence handling -----------------------------------------------
    timestamp: bool = Field(
        default=False,
        description="If True, append timestamp to filename",
    )
    dir_exist_ok: bool = Field(
        default=True,
        description="If True, creates directory if it doesn't exist",
    )
    file_exist_ok: bool = Field(
        default=False,
        description="If True, allows overwriting existing files",
    )

    # --- name decoration --------------------------------------------------
    time_prefix: bool = Field(
        default=False,
        description="If True, prepend timestamp instead of append",
    )
    timestamp_format: str | None = Field(
        default=None,
        description="Custom format for timestamp (strftime format)",
    )
    random_hash_digits: int = Field(
        default=0,
        ge=0,
        description="Number of random hash digits to append to filename",
    )

    # Note: unlike the other boolean options, this one defaults to True.
    verbose: bool = Field(
        default=True,
        description="If True, logs the file path after saving",
    )
|
@@ -0,0 +1,301 @@
|
|
1
|
+
import logging
|
2
|
+
import re
|
3
|
+
import sys
|
4
|
+
from datetime import datetime
|
5
|
+
from pathlib import Path
|
6
|
+
from typing import Any
|
7
|
+
|
8
|
+
from ..utils import unique_hash
|
9
|
+
|
10
|
+
|
11
|
+
def create_path(
|
12
|
+
directory: Path | str,
|
13
|
+
filename: str,
|
14
|
+
extension: str = None,
|
15
|
+
timestamp: bool = False,
|
16
|
+
dir_exist_ok: bool = True,
|
17
|
+
file_exist_ok: bool = False,
|
18
|
+
time_prefix: bool = False,
|
19
|
+
timestamp_format: str | None = None,
|
20
|
+
random_hash_digits: int = 0,
|
21
|
+
) -> Path:
|
22
|
+
"""
|
23
|
+
Generate a new file path with optional timestamp and random hash.
|
24
|
+
|
25
|
+
Args:
|
26
|
+
directory: The directory where the file will be created.
|
27
|
+
filename: The base name of the file to create.
|
28
|
+
timestamp: If True, adds a timestamp to the filename.
|
29
|
+
dir_exist_ok: If True, doesn't raise an error if the directory
|
30
|
+
exists.
|
31
|
+
file_exist_ok: If True, allows overwriting of existing files.
|
32
|
+
time_prefix: If True, adds the timestamp as a prefix instead of
|
33
|
+
a suffix.
|
34
|
+
timestamp_format: Custom format for the timestamp.
|
35
|
+
random_hash_digits: Number of digits for the random hash.
|
36
|
+
|
37
|
+
Returns:
|
38
|
+
The full path to the new or existing file.
|
39
|
+
|
40
|
+
Raises:
|
41
|
+
ValueError: If the filename contains illegal characters.
|
42
|
+
FileExistsError: If the file exists and file_exist_ok is False.
|
43
|
+
"""
|
44
|
+
if "/" in filename or "\\" in filename:
|
45
|
+
raise ValueError("Filename cannot contain directory separators.")
|
46
|
+
directory = Path(directory)
|
47
|
+
|
48
|
+
name, ext = None, None
|
49
|
+
if "." in filename:
|
50
|
+
name, ext = filename.rsplit(".", 1)
|
51
|
+
else:
|
52
|
+
name = filename
|
53
|
+
ext = extension.strip(".").strip() if extension else None
|
54
|
+
|
55
|
+
if not ext:
|
56
|
+
raise ValueError("No extension provided for filename.")
|
57
|
+
|
58
|
+
ext = f".{ext}" if ext else ""
|
59
|
+
|
60
|
+
if timestamp:
|
61
|
+
timestamp_str = datetime.now().strftime(
|
62
|
+
timestamp_format or "%Y%m%d%H%M%S"
|
63
|
+
)
|
64
|
+
name = (
|
65
|
+
f"{timestamp_str}_{name}"
|
66
|
+
if time_prefix
|
67
|
+
else f"{name}_{timestamp_str}"
|
68
|
+
)
|
69
|
+
|
70
|
+
if random_hash_digits > 0:
|
71
|
+
random_hash = "-" + unique_hash(random_hash_digits)
|
72
|
+
name = f"{name}{random_hash}"
|
73
|
+
|
74
|
+
full_filename = f"{name}{ext}"
|
75
|
+
full_path = directory / full_filename
|
76
|
+
|
77
|
+
if full_path.exists():
|
78
|
+
if file_exist_ok:
|
79
|
+
return full_path
|
80
|
+
raise FileExistsError(
|
81
|
+
f"File {full_path} already exists and file_exist_ok is False."
|
82
|
+
)
|
83
|
+
full_path.parent.mkdir(parents=True, exist_ok=dir_exist_ok)
|
84
|
+
return full_path
|
85
|
+
|
86
|
+
|
87
|
+
def is_valid_path(
|
88
|
+
path: str | Path,
|
89
|
+
*,
|
90
|
+
max_length: int | None = None,
|
91
|
+
allow_relative: bool = True,
|
92
|
+
allow_symlinks: bool = True,
|
93
|
+
custom_reserved_names: list[str] | None = None,
|
94
|
+
strict_mode: bool = False,
|
95
|
+
) -> bool:
|
96
|
+
"""
|
97
|
+
Validates whether the given path is syntactically valid for the current operating system.
|
98
|
+
|
99
|
+
Args:
|
100
|
+
path (Union[str, Path]): The filesystem path to validate.
|
101
|
+
max_length (Optional[int]): Maximum allowed path length. If None, uses OS default.
|
102
|
+
allow_relative (bool): Whether to allow relative paths. Default is True.
|
103
|
+
allow_symlinks (bool): Whether to allow symlinks. Default is True.
|
104
|
+
custom_reserved_names (Optional[List[str]]): Additional reserved names to check.
|
105
|
+
strict_mode (bool): If True, applies stricter validation rules. Default is False.
|
106
|
+
|
107
|
+
Returns:
|
108
|
+
bool: True if the path is valid, False otherwise.
|
109
|
+
|
110
|
+
Raises:
|
111
|
+
ValueError: If the path is invalid, with a detailed explanation.
|
112
|
+
"""
|
113
|
+
if isinstance(path, Path):
|
114
|
+
path_str = str(path)
|
115
|
+
elif isinstance(path, str):
|
116
|
+
path_str = path
|
117
|
+
else:
|
118
|
+
raise TypeError("Path must be a string or Path object.")
|
119
|
+
|
120
|
+
if not path_str:
|
121
|
+
raise ValueError("Path cannot be an empty string.")
|
122
|
+
|
123
|
+
issues = []
|
124
|
+
is_windows = sys.platform.startswith("win")
|
125
|
+
|
126
|
+
# Common checks for both Windows and Unix-like systems
|
127
|
+
if "\0" in path_str:
|
128
|
+
issues.append("Path contains null character.")
|
129
|
+
|
130
|
+
if not max_length:
|
131
|
+
max_length = 260 if is_windows else 4096
|
132
|
+
if len(path_str) > max_length:
|
133
|
+
issues.append(
|
134
|
+
f"Path exceeds the maximum length of {max_length} characters."
|
135
|
+
)
|
136
|
+
|
137
|
+
if is_windows:
|
138
|
+
# Windows-specific validation
|
139
|
+
invalid_chars = r'<>:"/\\|?*'
|
140
|
+
if re.search(f"[{re.escape(invalid_chars)}]", path_str):
|
141
|
+
issues.append(f"Path contains invalid characters: {invalid_chars}")
|
142
|
+
|
143
|
+
reserved_names = {
|
144
|
+
"CON",
|
145
|
+
"PRN",
|
146
|
+
"AUX",
|
147
|
+
"NUL",
|
148
|
+
"COM1",
|
149
|
+
"COM2",
|
150
|
+
"COM3",
|
151
|
+
"COM4",
|
152
|
+
"COM5",
|
153
|
+
"COM6",
|
154
|
+
"COM7",
|
155
|
+
"COM8",
|
156
|
+
"COM9",
|
157
|
+
"LPT1",
|
158
|
+
"LPT2",
|
159
|
+
"LPT3",
|
160
|
+
"LPT4",
|
161
|
+
"LPT5",
|
162
|
+
"LPT6",
|
163
|
+
"LPT7",
|
164
|
+
"LPT8",
|
165
|
+
"LPT9",
|
166
|
+
}
|
167
|
+
if custom_reserved_names:
|
168
|
+
reserved_names.update(custom_reserved_names)
|
169
|
+
|
170
|
+
path = Path(path_str)
|
171
|
+
for part in path.parts:
|
172
|
+
name = part.upper().rstrip(". ")
|
173
|
+
if name in reserved_names:
|
174
|
+
issues.append(f"Path contains a reserved name: '{part}'")
|
175
|
+
|
176
|
+
if path_str.endswith(" ") or path_str.endswith("."):
|
177
|
+
issues.append(
|
178
|
+
"Path cannot end with a space or a period on Windows."
|
179
|
+
)
|
180
|
+
|
181
|
+
if strict_mode:
|
182
|
+
if not path_str.startswith("\\\\?\\") and len(path_str) > 260:
|
183
|
+
issues.append(
|
184
|
+
"Path exceeds 260 characters without long path prefix."
|
185
|
+
)
|
186
|
+
|
187
|
+
else:
|
188
|
+
# Unix-like systems validation
|
189
|
+
if strict_mode:
|
190
|
+
if re.search(r"//+", path_str):
|
191
|
+
issues.append("Path contains consecutive slashes.")
|
192
|
+
|
193
|
+
if not allow_relative and not path_str.startswith("/"):
|
194
|
+
issues.append("Relative paths are not allowed.")
|
195
|
+
|
196
|
+
# Common additional checks
|
197
|
+
if not allow_symlinks and Path(path_str).is_symlink():
|
198
|
+
issues.append("Symlinks are not allowed.")
|
199
|
+
|
200
|
+
if strict_mode:
|
201
|
+
if re.search(r"\s", path_str):
|
202
|
+
issues.append("Path contains whitespace characters.")
|
203
|
+
|
204
|
+
if issues:
|
205
|
+
raise ValueError("Invalid path: " + "; ".join(issues))
|
206
|
+
|
207
|
+
return True
|
208
|
+
|
209
|
+
|
210
|
+
def split_path(path: Path | str) -> tuple[Path, str]:
|
211
|
+
"""
|
212
|
+
Split a path into its directory and filename components.
|
213
|
+
|
214
|
+
Args:
|
215
|
+
path: The path to split.
|
216
|
+
|
217
|
+
Returns:
|
218
|
+
A tuple containing the directory and filename.
|
219
|
+
"""
|
220
|
+
path = Path(path)
|
221
|
+
return path.parent, path.name
|
222
|
+
|
223
|
+
|
224
|
+
def _get_path_kwargs(
|
225
|
+
persist_path: str | Path, postfix: str, **path_kwargs: Any
|
226
|
+
) -> dict[str, Any]:
|
227
|
+
"""
|
228
|
+
Generate keyword arguments for path creation.
|
229
|
+
|
230
|
+
Args:
|
231
|
+
persist_path: The base path to use.
|
232
|
+
postfix: The file extension to use.
|
233
|
+
**path_kwargs: Additional keyword arguments to override defaults.
|
234
|
+
|
235
|
+
Returns:
|
236
|
+
A dictionary of keyword arguments for path creation.
|
237
|
+
"""
|
238
|
+
persist_path = Path(persist_path)
|
239
|
+
postfix = f".{postfix.strip('.')}"
|
240
|
+
|
241
|
+
if persist_path.suffix != postfix:
|
242
|
+
dirname = persist_path
|
243
|
+
filename = f"new_file{postfix}"
|
244
|
+
else:
|
245
|
+
dirname, filename = persist_path.parent, persist_path.name
|
246
|
+
|
247
|
+
return {
|
248
|
+
"timestamp": path_kwargs.get("timestamp", False),
|
249
|
+
"file_exist_ok": path_kwargs.get("file_exist_ok", True),
|
250
|
+
"directory": path_kwargs.get("directory", dirname),
|
251
|
+
"filename": path_kwargs.get("filename", filename),
|
252
|
+
}
|
253
|
+
|
254
|
+
|
255
|
+
def clear_path(
|
256
|
+
path: Path | str,
|
257
|
+
/,
|
258
|
+
recursive: bool = False,
|
259
|
+
exclude: list[str] | None = None,
|
260
|
+
) -> None:
|
261
|
+
"""
|
262
|
+
Clear all files and directories in the specified path.
|
263
|
+
|
264
|
+
Args:
|
265
|
+
path: The path to the directory to clear.
|
266
|
+
recursive: If True, clears directories recursively.
|
267
|
+
exclude: A list of string patterns to exclude from deletion.
|
268
|
+
|
269
|
+
Raises:
|
270
|
+
FileNotFoundError: If the specified directory does not exist.
|
271
|
+
PermissionError: If there are insufficient permissions to delete
|
272
|
+
files.
|
273
|
+
"""
|
274
|
+
path = Path(path)
|
275
|
+
if not path.exists():
|
276
|
+
raise FileNotFoundError(
|
277
|
+
f"The specified directory {path} does not exist."
|
278
|
+
)
|
279
|
+
|
280
|
+
exclude = exclude or []
|
281
|
+
exclude_pattern = re.compile("|".join(exclude)) if exclude else None
|
282
|
+
|
283
|
+
for file_path in path.iterdir():
|
284
|
+
if exclude_pattern and exclude_pattern.search(file_path.name):
|
285
|
+
logging.info(f"Excluded from deletion: {file_path}")
|
286
|
+
continue
|
287
|
+
|
288
|
+
try:
|
289
|
+
if file_path.is_dir():
|
290
|
+
if recursive:
|
291
|
+
clear_path(file_path, recursive=True, exclude=exclude)
|
292
|
+
file_path.rmdir()
|
293
|
+
else:
|
294
|
+
continue
|
295
|
+
else:
|
296
|
+
file_path.unlink()
|
297
|
+
logging.info(f"Successfully deleted {file_path}")
|
298
|
+
except PermissionError as e:
|
299
|
+
logging.error(f"Permission denied when deleting {file_path}: {e}")
|
300
|
+
except Exception as e:
|
301
|
+
logging.error(f"Failed to delete {file_path}: {e}")
|
@@ -0,0 +1,139 @@
|
|
1
|
+
import logging
|
2
|
+
from collections.abc import Callable
|
3
|
+
from concurrent.futures import ThreadPoolExecutor, as_completed
|
4
|
+
from pathlib import Path
|
5
|
+
from typing import Any
|
6
|
+
|
7
|
+
from .chunk import chunk_content
|
8
|
+
from .save import save_chunks
|
9
|
+
|
10
|
+
|
11
|
+
def dir_to_files(
|
12
|
+
directory: str | Path,
|
13
|
+
file_types: list[str] | None = None,
|
14
|
+
max_workers: int | None = None,
|
15
|
+
ignore_errors: bool = False,
|
16
|
+
verbose: bool = False,
|
17
|
+
) -> list[Path]:
|
18
|
+
"""
|
19
|
+
Recursively process a directory and return a list of file paths.
|
20
|
+
|
21
|
+
This function walks through the given directory and its subdirectories,
|
22
|
+
collecting file paths that match the specified file types (if any).
|
23
|
+
|
24
|
+
Args:
|
25
|
+
directory (Union[str, Path]): The directory to process.
|
26
|
+
file_types (Optional[List[str]]): List of file extensions to include (e.g., ['.txt', '.pdf']).
|
27
|
+
If None, include all file types.
|
28
|
+
max_workers (Optional[int]): Maximum number of worker threads for concurrent processing.
|
29
|
+
If None, uses the default ThreadPoolExecutor behavior.
|
30
|
+
ignore_errors (bool): If True, log warnings for errors instead of raising exceptions.
|
31
|
+
verbose (bool): If True, print verbose output.
|
32
|
+
|
33
|
+
Returns:
|
34
|
+
List[Path]: A list of Path objects representing the files found.
|
35
|
+
|
36
|
+
Raises:
|
37
|
+
ValueError: If the provided directory doesn't exist or isn't a directory.
|
38
|
+
"""
|
39
|
+
directory_path = Path(directory)
|
40
|
+
if not directory_path.is_dir():
|
41
|
+
raise ValueError(
|
42
|
+
f"The provided path is not a valid directory: {directory}"
|
43
|
+
)
|
44
|
+
|
45
|
+
def process_file(file_path: Path) -> Path | None:
|
46
|
+
try:
|
47
|
+
if file_types is None or file_path.suffix in file_types:
|
48
|
+
return file_path
|
49
|
+
except Exception as e:
|
50
|
+
if ignore_errors:
|
51
|
+
if verbose:
|
52
|
+
logging.warning(f"Error processing {file_path}: {e}")
|
53
|
+
else:
|
54
|
+
raise ValueError(f"Error processing {file_path}: {e}") from e
|
55
|
+
return None
|
56
|
+
|
57
|
+
try:
|
58
|
+
with ThreadPoolExecutor(max_workers=max_workers) as executor:
|
59
|
+
futures = [
|
60
|
+
executor.submit(process_file, f)
|
61
|
+
for f in directory_path.rglob("*")
|
62
|
+
if f.is_file()
|
63
|
+
]
|
64
|
+
files = [
|
65
|
+
future.result()
|
66
|
+
for future in as_completed(futures)
|
67
|
+
if future.result() is not None
|
68
|
+
]
|
69
|
+
|
70
|
+
if verbose:
|
71
|
+
logging.info(f"Processed {len(files)} files from {directory}")
|
72
|
+
|
73
|
+
return files
|
74
|
+
except Exception as e:
|
75
|
+
raise ValueError(f"Error processing directory {directory}: {e}") from e
|
76
|
+
|
77
|
+
|
78
|
+
def file_to_chunks(
    file_path: str | Path,
    chunk_func: Callable[[str, int, float, int], list[str]],
    chunk_size: int = 1500,
    overlap: float = 0.1,
    threshold: int = 200,
    encoding: str = "utf-8",
    custom_metadata: dict[str, Any] | None = None,
    output_dir: str | Path | None = None,
    verbose: bool = False,
    timestamp: bool = True,
    random_hash_digits: int = 4,
) -> list[dict[str, Any]]:
    """
    Read a text file and split its content into chunks.

    The file is read in full, basic file metadata is assembled, and both
    are handed to ``chunk_content``. When ``output_dir`` is given, the
    resulting chunks are additionally passed to ``save_chunks``.

    Args:
        file_path: Path to the file to be processed.
        chunk_func: Function to use for chunking the content.
        chunk_size: The target size for each chunk.
        overlap: The fraction of overlap between chunks.
        threshold: The minimum size for the last chunk.
        encoding: File encoding to use when reading the file.
        custom_metadata: Extra metadata merged over the file metadata
            (``file_path``, ``file_name``, ``file_size``); on key
            collisions the custom value wins.
        output_dir: Directory to save output chunks (if provided).
        verbose: Forwarded to ``save_chunks``.
        timestamp: Forwarded to ``save_chunks``.
        random_hash_digits: Forwarded to ``save_chunks``.

    Returns:
        Whatever ``chunk_content`` returns for the file content.

    Raises:
        ValueError: If any step fails; the original exception is chained.
    """
    try:
        file_path = Path(file_path)
        with file_path.open(encoding=encoding) as handle:
            content = handle.read()

        file_metadata: dict[str, Any] = {
            "file_path": str(file_path),
            "file_name": file_path.name,
            "file_size": file_path.stat().st_size,
        }
        # Custom entries are applied last so they override the file fields.
        metadata = {**file_metadata, **(custom_metadata or {})}

        # NOTE(review): the arguments are passed positionally; confirm that
        # this order (content, chunk_func, chunk_size, overlap, threshold,
        # metadata) matches chunk_content's actual signature.
        chunks = chunk_content(
            content, chunk_func, chunk_size, overlap, threshold, metadata
        )

        if output_dir:
            save_chunks(
                chunks, output_dir, verbose, timestamp, random_hash_digits
            )
    except Exception as e:
        raise ValueError(f"Error processing file {file_path}: {e}") from e
    else:
        return chunks
|