PyPI - waldiez - Versions diffs - 0.4.7__py3-none-any.whl → 0.4.8__py3-none-any.whl - Mend

waldiez 0.4.7__py3-none-any.whl → 0.4.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of waldiez might be problematic. Click here for more details.

Files changed (244) hide show

waldiez/__init__.py +5 -5
waldiez/_version.py +1 -1
waldiez/cli.py +112 -73
waldiez/exporter.py +61 -19
waldiez/exporting/__init__.py +25 -6
waldiez/exporting/agent/__init__.py +7 -3
waldiez/exporting/agent/code_execution.py +114 -0
waldiez/exporting/agent/exporter.py +354 -0
waldiez/exporting/agent/extras/__init__.py +15 -0
waldiez/exporting/agent/extras/captain_agent_extras.py +315 -0
waldiez/exporting/agent/extras/group/target.py +178 -0
waldiez/exporting/agent/extras/group_manager_agent_extas.py +500 -0
waldiez/exporting/agent/extras/group_member_extras.py +181 -0
waldiez/exporting/agent/extras/handoffs/__init__.py +19 -0
waldiez/exporting/agent/extras/handoffs/after_work.py +78 -0
waldiez/exporting/agent/extras/handoffs/available.py +74 -0
waldiez/exporting/agent/extras/handoffs/condition.py +158 -0
waldiez/exporting/agent/extras/handoffs/handoff.py +171 -0
waldiez/exporting/agent/extras/handoffs/target.py +189 -0
waldiez/exporting/agent/extras/rag/__init__.py +10 -0
waldiez/exporting/agent/{utils/rag_user/chroma_utils.py → extras/rag/chroma_extras.py} +16 -15
waldiez/exporting/agent/{utils/rag_user/mongo_utils.py → extras/rag/mongo_extras.py} +10 -10
waldiez/exporting/agent/{utils/rag_user/pgvector_utils.py → extras/rag/pgvector_extras.py} +13 -13
waldiez/exporting/agent/{utils/rag_user/qdrant_utils.py → extras/rag/qdrant_extras.py} +13 -13
waldiez/exporting/agent/{utils/rag_user/vector_db.py → extras/rag/vector_db_extras.py} +59 -46
waldiez/exporting/agent/extras/rag_user_proxy_agent_extras.py +245 -0
waldiez/exporting/agent/extras/reasoning_agent_extras.py +88 -0
waldiez/exporting/agent/factory.py +95 -0
waldiez/exporting/agent/processor.py +150 -0
waldiez/exporting/agent/system_message.py +36 -0
waldiez/exporting/agent/termination.py +50 -0
waldiez/exporting/chats/__init__.py +7 -3
waldiez/exporting/chats/exporter.py +97 -0
waldiez/exporting/chats/factory.py +65 -0
waldiez/exporting/chats/processor.py +226 -0
waldiez/exporting/chats/utils/__init__.py +6 -5
waldiez/exporting/chats/utils/common.py +11 -45
waldiez/exporting/chats/utils/group.py +55 -0
waldiez/exporting/chats/utils/nested.py +37 -52
waldiez/exporting/chats/utils/sequential.py +72 -61
waldiez/exporting/chats/utils/{single_chat.py → single.py} +48 -50
waldiez/exporting/core/__init__.py +196 -0
waldiez/exporting/core/constants.py +17 -0
waldiez/exporting/core/content.py +69 -0
waldiez/exporting/core/context.py +244 -0
waldiez/exporting/core/enums.py +89 -0
waldiez/exporting/core/errors.py +19 -0
waldiez/exporting/core/exporter.py +390 -0
waldiez/exporting/core/exporters.py +67 -0
waldiez/exporting/core/extras/__init__.py +39 -0
waldiez/exporting/core/extras/agent_extras/__init__.py +27 -0
waldiez/exporting/core/extras/agent_extras/captain_extras.py +57 -0
waldiez/exporting/core/extras/agent_extras/group_manager_extras.py +102 -0
waldiez/exporting/core/extras/agent_extras/rag_user_extras.py +53 -0
waldiez/exporting/core/extras/agent_extras/reasoning_extras.py +68 -0
waldiez/exporting/core/extras/agent_extras/standard_extras.py +263 -0
waldiez/exporting/core/extras/base.py +241 -0
waldiez/exporting/core/extras/chat_extras.py +118 -0
waldiez/exporting/core/extras/flow_extras.py +70 -0
waldiez/exporting/core/extras/model_extras.py +73 -0
waldiez/exporting/core/extras/path_resolver.py +93 -0
waldiez/exporting/core/extras/serializer.py +138 -0
waldiez/exporting/core/extras/tool_extras.py +82 -0
waldiez/exporting/core/protocols.py +259 -0
waldiez/exporting/core/result.py +705 -0
waldiez/exporting/core/types.py +329 -0
waldiez/exporting/core/utils/__init__.py +11 -0
waldiez/exporting/core/utils/comment.py +33 -0
waldiez/exporting/core/utils/llm_config.py +117 -0
waldiez/exporting/core/validation.py +96 -0
waldiez/exporting/flow/__init__.py +6 -2
waldiez/exporting/flow/execution_generator.py +193 -0
waldiez/exporting/flow/exporter.py +107 -0
waldiez/exporting/flow/factory.py +94 -0
waldiez/exporting/flow/file_generator.py +214 -0
waldiez/exporting/flow/merger.py +387 -0
waldiez/exporting/flow/orchestrator.py +411 -0
waldiez/exporting/flow/utils/__init__.py +9 -36
waldiez/exporting/flow/utils/common.py +206 -0
waldiez/exporting/flow/utils/importing.py +373 -0
waldiez/exporting/flow/utils/linting.py +200 -0
waldiez/exporting/flow/utils/{logging_utils.py → logging.py} +23 -9
waldiez/exporting/models/__init__.py +3 -1
waldiez/exporting/models/exporter.py +233 -0
waldiez/exporting/models/factory.py +66 -0
waldiez/exporting/models/processor.py +139 -0
waldiez/exporting/tools/__init__.py +11 -0
waldiez/exporting/tools/exporter.py +207 -0
waldiez/exporting/tools/factory.py +57 -0
waldiez/exporting/tools/processor.py +248 -0
waldiez/exporting/tools/registration.py +133 -0
waldiez/io/__init__.py +128 -0
waldiez/io/_ws.py +199 -0
waldiez/io/models/__init__.py +60 -0
waldiez/io/models/base.py +66 -0
waldiez/io/models/constants.py +78 -0
waldiez/io/models/content/__init__.py +23 -0
waldiez/io/models/content/audio.py +43 -0
waldiez/io/models/content/base.py +45 -0
waldiez/io/models/content/file.py +43 -0
waldiez/io/models/content/image.py +96 -0
waldiez/io/models/content/text.py +37 -0
waldiez/io/models/content/video.py +43 -0
waldiez/io/models/user_input.py +269 -0
waldiez/io/models/user_response.py +215 -0
waldiez/io/mqtt.py +681 -0
waldiez/io/redis.py +782 -0
waldiez/io/structured.py +419 -0
waldiez/io/utils.py +184 -0
waldiez/io/ws.py +298 -0
waldiez/logger.py +481 -0
waldiez/models/__init__.py +108 -51
waldiez/models/agents/__init__.py +34 -70
waldiez/models/agents/agent/__init__.py +10 -4
waldiez/models/agents/agent/agent.py +466 -65
waldiez/models/agents/agent/agent_data.py +119 -47
waldiez/models/agents/agent/agent_type.py +13 -2
waldiez/models/agents/agent/code_execution.py +12 -12
waldiez/models/agents/agent/human_input_mode.py +8 -0
waldiez/models/agents/agent/{linked_skill.py → linked_tool.py} +7 -7
waldiez/models/agents/agent/nested_chat.py +35 -7
waldiez/models/agents/agent/termination_message.py +30 -22
waldiez/models/agents/{swarm_agent → agent}/update_system_message.py +22 -22
waldiez/models/agents/agents.py +58 -63
waldiez/models/agents/assistant/assistant.py +4 -4
waldiez/models/agents/assistant/assistant_data.py +13 -1
waldiez/models/agents/{captain_agent → captain}/captain_agent.py +5 -5
waldiez/models/agents/{captain_agent → captain}/captain_agent_data.py +5 -5
waldiez/models/agents/extra_requirements.py +11 -16
waldiez/models/agents/group_manager/group_manager.py +103 -13
waldiez/models/agents/group_manager/group_manager_data.py +36 -14
waldiez/models/agents/group_manager/speakers.py +77 -24
waldiez/models/agents/{rag_user → rag_user_proxy}/__init__.py +16 -16
waldiez/models/agents/rag_user_proxy/rag_user_proxy.py +64 -0
waldiez/models/agents/{rag_user/rag_user_data.py → rag_user_proxy/rag_user_proxy_data.py} +6 -5
waldiez/models/agents/{rag_user → rag_user_proxy}/retrieve_config.py +182 -114
waldiez/models/agents/{rag_user → rag_user_proxy}/vector_db_config.py +13 -13
waldiez/models/agents/reasoning/reasoning_agent.py +6 -6
waldiez/models/agents/reasoning/reasoning_agent_data.py +110 -63
waldiez/models/agents/reasoning/reasoning_agent_reason_config.py +38 -10
waldiez/models/agents/user_proxy/user_proxy.py +11 -7
waldiez/models/agents/user_proxy/user_proxy_data.py +2 -2
waldiez/models/chat/__init__.py +2 -1
waldiez/models/chat/chat.py +166 -87
waldiez/models/chat/chat_data.py +99 -136
waldiez/models/chat/chat_message.py +33 -23
waldiez/models/chat/chat_nested.py +31 -30
waldiez/models/chat/chat_summary.py +10 -8
waldiez/models/common/__init__.py +52 -2
waldiez/models/common/ag2_version.py +1 -1
waldiez/models/common/base.py +38 -7
waldiez/models/common/dict_utils.py +42 -17
waldiez/models/common/handoff.py +459 -0
waldiez/models/common/id_generator.py +19 -0
waldiez/models/common/method_utils.py +130 -68
waldiez/{exporting/base/utils → models/common}/naming.py +38 -61
waldiez/models/common/waldiez_version.py +37 -0
waldiez/models/flow/__init__.py +9 -2
waldiez/models/flow/connection.py +18 -0
waldiez/models/flow/flow.py +311 -215
waldiez/models/flow/flow_data.py +207 -40
waldiez/models/flow/info.py +85 -0
waldiez/models/flow/naming.py +131 -0
waldiez/models/model/__init__.py +7 -1
waldiez/models/model/extra_requirements.py +3 -12
waldiez/models/model/model.py +76 -21
waldiez/models/model/model_data.py +108 -20
waldiez/models/tool/__init__.py +16 -0
waldiez/models/tool/extra_requirements.py +36 -0
waldiez/models/{skill/skill.py → tool/tool.py} +88 -88
waldiez/models/tool/tool_data.py +51 -0
waldiez/models/tool/tool_type.py +8 -0
waldiez/models/waldiez.py +97 -80
waldiez/runner.py +114 -49
waldiez/running/__init__.py +1 -1
waldiez/running/environment.py +49 -68
waldiez/running/gen_seq_diagram.py +16 -14
waldiez/running/running.py +53 -34
waldiez/utils/__init__.py +0 -4
waldiez/utils/cli_extras/jupyter.py +5 -3
waldiez/utils/cli_extras/runner.py +6 -4
waldiez/utils/cli_extras/studio.py +6 -4
waldiez/utils/conflict_checker.py +15 -9
waldiez/utils/flaml_warnings.py +5 -5
{waldiez-0.4.7.dist-info → waldiez-0.4.8.dist-info}/METADATA +235 -91
waldiez-0.4.8.dist-info/RECORD +200 -0
waldiez/exporting/agent/agent_exporter.py +0 -297
waldiez/exporting/agent/utils/__init__.py +0 -23
waldiez/exporting/agent/utils/captain_agent.py +0 -263
waldiez/exporting/agent/utils/code_execution.py +0 -65
waldiez/exporting/agent/utils/group_manager.py +0 -220
waldiez/exporting/agent/utils/rag_user/__init__.py +0 -7
waldiez/exporting/agent/utils/rag_user/rag_user.py +0 -209
waldiez/exporting/agent/utils/reasoning.py +0 -36
waldiez/exporting/agent/utils/swarm_agent.py +0 -469
waldiez/exporting/agent/utils/teachability.py +0 -41
waldiez/exporting/agent/utils/termination_message.py +0 -44
waldiez/exporting/base/__init__.py +0 -25
waldiez/exporting/base/agent_position.py +0 -75
waldiez/exporting/base/base_exporter.py +0 -118
waldiez/exporting/base/export_position.py +0 -48
waldiez/exporting/base/import_position.py +0 -23
waldiez/exporting/base/mixin.py +0 -137
waldiez/exporting/base/utils/__init__.py +0 -18
waldiez/exporting/base/utils/comments.py +0 -96
waldiez/exporting/base/utils/path_check.py +0 -68
waldiez/exporting/base/utils/to_string.py +0 -84
waldiez/exporting/chats/chats_exporter.py +0 -240
waldiez/exporting/chats/utils/swarm.py +0 -210
waldiez/exporting/flow/flow_exporter.py +0 -528
waldiez/exporting/flow/utils/agent_utils.py +0 -204
waldiez/exporting/flow/utils/chat_utils.py +0 -71
waldiez/exporting/flow/utils/def_main.py +0 -77
waldiez/exporting/flow/utils/flow_content.py +0 -202
waldiez/exporting/flow/utils/flow_names.py +0 -116
waldiez/exporting/flow/utils/importing_utils.py +0 -227
waldiez/exporting/models/models_exporter.py +0 -199
waldiez/exporting/models/utils.py +0 -174
waldiez/exporting/skills/__init__.py +0 -9
waldiez/exporting/skills/skills_exporter.py +0 -176
waldiez/exporting/skills/utils.py +0 -369
waldiez/models/agents/agent/teachability.py +0 -70
waldiez/models/agents/rag_user/rag_user.py +0 -60
waldiez/models/agents/swarm_agent/__init__.py +0 -50
waldiez/models/agents/swarm_agent/after_work.py +0 -179
waldiez/models/agents/swarm_agent/on_condition.py +0 -105
waldiez/models/agents/swarm_agent/on_condition_available.py +0 -142
waldiez/models/agents/swarm_agent/on_condition_target.py +0 -40
waldiez/models/agents/swarm_agent/swarm_agent.py +0 -107
waldiez/models/agents/swarm_agent/swarm_agent_data.py +0 -124
waldiez/models/flow/utils.py +0 -232
waldiez/models/skill/__init__.py +0 -16
waldiez/models/skill/extra_requirements.py +0 -36
waldiez/models/skill/skill_data.py +0 -53
waldiez/models/skill/skill_type.py +0 -8
waldiez/utils/pysqlite3_checker.py +0 -308
waldiez/utils/rdps_checker.py +0 -122
waldiez-0.4.7.dist-info/RECORD +0 -149
/waldiez/models/agents/{captain_agent → captain}/__init__.py +0 -0
/waldiez/models/agents/{captain_agent → captain}/captain_agent_lib_entry.py +0 -0
{waldiez-0.4.7.dist-info → waldiez-0.4.8.dist-info}/WHEEL +0 -0
{waldiez-0.4.7.dist-info → waldiez-0.4.8.dist-info}/entry_points.txt +0 -0
{waldiez-0.4.7.dist-info → waldiez-0.4.8.dist-info}/licenses/LICENSE +0 -0
{waldiez-0.4.7.dist-info → waldiez-0.4.8.dist-info}/licenses/NOTICE.md +0 -0

waldiez/models/agents/{rag_user → rag_user_proxy}/retrieve_config.py RENAMED Viewed

@@ -4,21 +4,21 @@
 import os
 from pathlib import Path
-from typing import Dict, List, Optional, Tuple, Union
+from typing import Optional, Union
 from pydantic import Field, model_validator
 from typing_extensions import Annotated, Literal, Self
 from ...common import WaldiezBase, check_function, generate_function
-from .vector_db_config import WaldiezRagUserVectorDbConfig
+from .vector_db_config import WaldiezRagUserProxyVectorDbConfig
-WaldiezRagUserTask = Literal["code", "qa", "default"]
+WaldiezRagUserProxyTask = Literal["code", "qa", "default"]
 """Possible tasks for the retrieve chat."""
-WaldiezRagUserVectorDb = Literal["chroma", "pgvector", "mongodb", "qdrant"]
+WaldiezRagUserProxyVectorDb = Literal["chroma", "pgvector", "mongodb", "qdrant"]
 """Possible vector dbs for the retrieve chat."""
-WaldiezRagUserChunkMode = Literal["multi_lines", "one_line"]
+WaldiezRagUserProxyChunkMode = Literal["multi_lines", "one_line"]
 """Possible chunk modes for the retrieve chat."""
-WaldiezRagUserModels: Dict[WaldiezRagUserVectorDb, str] = {
+WaldiezRagUserProxyModels: dict[WaldiezRagUserProxyVectorDb, str] = {
     "chroma": "all-MiniLM-L6-v2",
     "mongodb": "all-MiniLM-L6-v2",
     "pgvector": "all-MiniLM-L6-v2",
@@ -26,8 +26,8 @@ WaldiezRagUserModels: Dict[WaldiezRagUserVectorDb, str] = {
 }
 CUSTOM_EMBEDDING_FUNCTION = "custom_embedding_function"
-CUSTOM_EMBEDDING_FUNCTION_ARGS: List[str] = []
-CUSTOM_EMBEDDING_FUNCTION_TYPES: Tuple[List[str], str] = (
+CUSTOM_EMBEDDING_FUNCTION_ARGS: list[str] = []
+CUSTOM_EMBEDDING_FUNCTION_TYPES: tuple[list[str], str] = (
     [],
     "Callable[..., Any]",
 )
@@ -48,7 +48,7 @@ CUSTOM_TEXT_SPLIT_FUNCTION_ARGS = [
 ]
 CUSTOM_TEXT_SPLIT_FUNCTION_TYPES = (
     ["str", "int", "str", "bool", "int"],
-    "List[str]",
+    "list[str]",
 )
 NOT_LOCAL = (
     "http://",
@@ -56,10 +56,14 @@ NOT_LOCAL = (
     "ftp://",
     "ftps://",
     "sftp://",
+    "hdfs",
+    "s3://",
+    "gs://",
+    "azure://",
 )
-class WaldiezRagUserRetrieveConfig(WaldiezBase):
+class WaldiezRagUserProxyRetrieveConfig(WaldiezBase):
     """RAG user agent.
     Attributes
@@ -74,7 +78,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         The vector db for the retrieve chat.
     db_config : Annotated[WaldiezVectorDbConfig, Field]
         The config for the selected vector db.
-    docs_path : Optional[Union[str, List[str]]]
+    docs_path : Optional[Union[str, list[str]]]
         The path to the docs directory. It can also be the path to a single
         file, the url to a single file or a list of directories, files and
         urls. Default is None, which works only if the collection is already
@@ -147,7 +151,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         A custom function to split a string into a list of strings. Default is
         None, will use the default function in autogen.retrieve_utils.
         split_text_to_chunks.
-    custom_text_types : Optional[List[str]]
+    custom_text_types : Optional[list[str]]
         A list of file types to be processed. Default is autogen.retrieve_utils.
         TEXT_FORMATS. This only applies to files under the directories in
         docs_path. Explicitly included files and urls will be chunked
@@ -180,9 +184,9 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
     """
     task: Annotated[
-        WaldiezRagUserTask,
+        WaldiezRagUserProxyTask,
         Field(
-            "default",
+            default="default",
             title="Task",
             description=(
                 "The task of the retrieve chat. "
@@ -193,25 +197,25 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "the response."
             ),
         ),
-    ]
+    ] = "default"
     vector_db: Annotated[
-        WaldiezRagUserVectorDb,
+        WaldiezRagUserProxyVectorDb,
         Field(
-            "chroma",
+            default="chroma",
             title="Vector DB",
             description="The vector db for the retrieve chat.",
         ),
-    ]
+    ] = "chroma"
     db_config: Annotated[
-        WaldiezRagUserVectorDbConfig,
+        WaldiezRagUserProxyVectorDbConfig,
         Field(
             title="DB Config",
             description="The config for the selected vector db.",
-            default_factory=WaldiezRagUserVectorDbConfig,
+            default_factory=WaldiezRagUserProxyVectorDbConfig,
         ),
     ]
     docs_path: Annotated[
-        Optional[Union[str, List[str]]],
+        Optional[Union[str, list[str]]],
         Field(
             default=None,
             title="Docs Path",
@@ -222,7 +226,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "only if the collection is already created."
             ),
         ),
-    ]
+    ] = None
     new_docs: Annotated[
         bool,
         Field(
@@ -236,7 +240,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "hash value of the content."
             ),
         ),
-    ]
+    ] = True
     model: Annotated[
         Optional[str],
         Field(
@@ -247,7 +251,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "we check for models linked to the agent."
             ),
         ),
-    ]
+    ] = None
     chunk_token_size: Annotated[
         Optional[int],
         Field(
@@ -259,7 +263,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "will be used."
             ),
         ),
-    ]
+    ] = None
     context_max_tokens: Annotated[
         Optional[int],
         Field(
@@ -271,9 +275,9 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "will be used."
             ),
         ),
-    ]
+    ] = None
     chunk_mode: Annotated[
-        WaldiezRagUserChunkMode,
+        WaldiezRagUserProxyChunkMode,
         Field(
             default="multi_lines",
             title="Chunk Mode",
@@ -283,8 +287,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "a default mode multi_lines will be used."
             ),
         ),
-    ]
+    ] = "multi_lines"
     must_break_at_empty_line: Annotated[
         bool,
         Field(
@@ -295,7 +298,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "If chunk_mode is 'one_line', this parameter will be ignored."
             ),
         ),
-    ]
+    ] = True
     use_custom_embedding: Annotated[
         bool,
         Field(
@@ -307,7 +310,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "provided."
             ),
         ),
-    ]
+    ] = False
     embedding_function: Annotated[
         Optional[str],
         Field(
@@ -322,7 +325,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "https://docs.trychroma.com/guides/embeddings."
             ),
         ),
-    ]
+    ] = None
     customized_prompt: Annotated[
         Optional[str],
         Field(
@@ -332,7 +335,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "The customized prompt for the retrieve chat. Default is None."
             ),
         ),
-    ]
+    ] = None
     customized_answer_prefix: Annotated[
         Optional[str],
         Field(
@@ -344,7 +347,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "not in the answer, Update Context will be triggered."
             ),
         ),
-    ]
+    ] = ""
     update_context: Annotated[
         bool,
         Field(
@@ -355,7 +358,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "retrieval. Default is True."
             ),
         ),
-    ]
+    ] = True
     collection_name: Annotated[
         str,
         Field(
@@ -366,7 +369,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "a default name autogen-docs will be used."
             ),
         ),
-    ]
+    ] = "autogen-docs"
     get_or_create: Annotated[
         bool,
         Field(
@@ -376,7 +379,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "Whether to get the collection if it exists. Default is False."
             ),
         ),
-    ]
+    ] = False
     overwrite: Annotated[
         bool,
         Field(
@@ -394,7 +397,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 " otherwise it raise a ValueError."
             ),
         ),
-    ]
+    ] = False
     use_custom_token_count: Annotated[
         bool,
         Field(
@@ -406,7 +409,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "custom_token_count_function should be provided."
             ),
         ),
-    ]
+    ] = False
     custom_token_count_function: Annotated[
         Optional[str],
         Field(
@@ -421,7 +424,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "tiktoken, which may not be accurate for non-OpenAI models."
             ),
         ),
-    ]
+    ] = None
     use_custom_text_split: Annotated[
         bool,
         Field(
@@ -433,7 +436,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "custom_text_split_function should be provided."
             ),
         ),
-    ]
+    ] = False
     custom_text_split_function: Annotated[
         Optional[str],
         Field(
@@ -445,9 +448,9 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "autogen.retrieve_utils.split_text_to_chunks."
             ),
         ),
-    ]
+    ] = None
     custom_text_types: Annotated[
-        Optional[List[str]],
+        Optional[list[str]],
         Field(
             default=None,
             title="Custom Text Types",
@@ -459,7 +462,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "chunked regardless of their types."
             ),
         ),
-    ]
+    ] = None
     recursive: Annotated[
         bool,
         Field(
@@ -470,7 +473,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "Default is True."
             ),
         ),
-    ]
+    ] = True
     distance_threshold: Annotated[
         float,
         Field(
@@ -482,7 +485,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "Will be ignored if < 0. Default is -1."
             ),
         ),
-    ]
+    ] = -1
     n_results: Annotated[
         Optional[int],
         Field(
@@ -494,7 +497,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
                 "Use None or <1 to return all results."
             ),
         ),
-    ]
+    ] = None
     _embedding_function_string: Optional[str] = None
     _token_count_function_string: Optional[str] = None
@@ -538,7 +541,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         self,
         name_prefix: Optional[str] = None,
         name_suffix: Optional[str] = None,
-    ) -> Tuple[str, str]:
+    ) -> tuple[str, str]:
         """Generate the custom embedding function.
         Parameters
@@ -550,7 +553,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         Returns
         -------
-        Tuple[str, str]
+        tuple[str, str]
             The custom embedding function and the function name.
         """
         function_name = CUSTOM_EMBEDDING_FUNCTION
@@ -572,7 +575,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         self,
         name_prefix: Optional[str] = None,
         name_suffix: Optional[str] = None,
-    ) -> Tuple[str, str]:
+    ) -> tuple[str, str]:
         """Generate the custom token count function.
         Parameters
@@ -584,7 +587,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         Returns
         -------
-        Tuple[str, str]
+        tuple[str, str]
             The custom token count function and the function name.
         """
         function_name = CUSTOM_TOKEN_COUNT_FUNCTION
@@ -606,7 +609,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         self,
         name_prefix: Optional[str] = None,
         name_suffix: Optional[str] = None,
-    ) -> Tuple[str, str]:
+    ) -> tuple[str, str]:
         """Generate the custom text split function.
         Parameters
@@ -618,7 +621,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         Returns
         -------
-        Tuple[str, str]
+        tuple[str, str]
             The custom text split function and the function name.
         """
         function_name = CUSTOM_TEXT_SPLIT_FUNCTION
@@ -715,35 +718,50 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         """
         if not self.docs_path:
             return
-        # if urls or directories ok, if files they should resolve
+        # Normalize to list
         doc_paths = (
             [self.docs_path]
             if isinstance(self.docs_path, str)
             else self.docs_path
         )
-        paths: List[str] = []
+        validated_paths: list[str] = []
         for path in doc_paths:
-            resolved = path
-            is_remote, is_raw = is_remote_path(resolved)
-            if is_remote:
-                if not is_raw:
-                    resolved = f'r"{resolved}"'
-                if resolved not in paths:
-                    paths.append(resolved)
+            # Skip duplicates
+            if path in validated_paths:
                 continue
-            resolved = remove_file_scheme(resolved)
-            is_raw = resolved.startswith(("r'", 'r"'))
-            maybe_folder = string_represents_folder(resolved)
-            if maybe_folder:
-                if not is_raw:
-                    resolved = f'r"{resolved}"'
-                if resolved not in paths:
-                    paths.append(resolved)
+            # Check if it's a remote path
+            is_remote = is_remote_path(path)
+            if is_remote:
+                # Remote paths: ensure proper raw string wrapping if needed
+                content = extract_raw_string_content(path)
+                validated_paths.append(f'r"{content}"')
                 continue
-            resolved = resolve_path(resolved, is_raw, not maybe_folder)
-            if resolved not in paths:
-                paths.append(resolved)
-        self.docs_path = paths
+            # Handle local paths
+            # First remove any file:// scheme
+            cleaned_path = remove_file_scheme(path)
+            content = extract_raw_string_content(cleaned_path)
+            # Determine if it's likely a folder
+            is_folder = string_represents_folder(content)
+            if is_folder:
+                validated_paths.append(f'r"{content}"')
+            else:
+                # Files: resolve and validate existence
+                try:
+                    resolved_path = resolve_path(cleaned_path, must_exist=True)
+                    validated_paths.append(resolved_path)
+                except ValueError as e:
+                    raise ValueError(f"Invalid file path '{path}': {e}") from e
+        # remove dupes (but keep order)
+        validated_paths = list(dict.fromkeys(validated_paths))
+        self.docs_path = [path for path in validated_paths if path]
     @model_validator(mode="after")
     def validate_rag_user_data(self) -> Self:
@@ -756,7 +774,7 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         Returns
         -------
-        WaldiezRagUserData
+        WaldiezRagUserProxyData
             The validated RAG user data.
         """
         self.validate_custom_embedding_function()
@@ -764,12 +782,35 @@ class WaldiezRagUserRetrieveConfig(WaldiezBase):
         self.validate_custom_text_split_function()
         self.validate_docs_path()
         if not self.db_config.model:
-            self.db_config.model = WaldiezRagUserModels[self.vector_db]
+            self.db_config.model = WaldiezRagUserProxyModels[self.vector_db]
         if isinstance(self.n_results, int) and self.n_results < 1:
             self.n_results = None
         return self
+def extract_raw_string_content(path: str) -> str:
+    """Extract content from potential raw string formats.
+    Parameters
+    ----------
+    path : str
+        The path that might be wrapped in raw string format.
+    Returns
+    -------
+    str
+        The actual content of the path, without raw string formatting.
+    """
+    # Handle r"..." and r'...'
+    if path.startswith(('r"', "r'")) and len(path) > 3:
+        quote = path[1]
+        if path.endswith(quote):
+            return path[2:-1]
+        # Handle malformed raw strings (missing end quote)
+        return path[2:]
+    return path
 def string_represents_folder(path: str) -> bool:
     """Check if a string represents a folder.
@@ -783,14 +824,27 @@ def string_represents_folder(path: str) -> bool:
     bool
         True if the path is likely a folder, False if it's likely a file.
     """
-    if path.endswith(os.path.sep):
-        return True
-    if os.path.isdir(path):
+    # Extract actual path content if wrapped
+    content = extract_raw_string_content(path)
+    # Explicit folder indicators
+    if content.endswith(("/", "\\", os.path.sep)):
         return True
-    return not os.path.splitext(path)[1]
+    # Check if it actually exists and is a directory
+    try:
+        if os.path.isdir(content):
+            return True
+    except (OSError, ValueError):  # pragma: no cover
+        pass
+    # Heuristic: no file extension likely means folder
+    # return not os.path.splitext(content)[1]
+    _, ext = os.path.splitext(path.rstrip("/\\"))
+    return not ext
-def is_remote_path(path: str) -> Tuple[bool, bool]:
+def is_remote_path(path: str) -> bool:
     """Check if a path is a remote path.
     Parameters
@@ -800,14 +854,14 @@ def is_remote_path(path: str) -> Tuple[bool, bool]:
     Returns
     -------
-    Tuple[bool, bool]
+    tuple[bool, bool]
         If the path is a remote path and if it's a raw string.
     """
-    is_raw = path.startswith(("r'", 'r"'))
+    content = extract_raw_string_content(path)
     for not_local in NOT_LOCAL:
-        if path.startswith((not_local, f'r"{not_local}', f"r'{not_local}")):
-            return True, is_raw
-    return False, is_raw
+        if content.startswith((not_local, f'r"{not_local}', f"r'{not_local}")):
+            return True
+    return False
 def remove_file_scheme(path: str) -> str:
@@ -823,54 +877,68 @@ def remove_file_scheme(path: str) -> str:
     str
         The path without the scheme.
     """
-    resolved = str(path)
-    while resolved.startswith('r"file://') and resolved.endswith('"'):
-        resolved = resolved[len('r"file://') : -1]
-    while resolved.startswith("r'file://") and resolved.endswith("'"):
-        resolved = resolved[len("r'file://") : -1]
-    while resolved.startswith("file://"):
-        resolved = resolved[len("file://") :]
-    return resolved
+    content = extract_raw_string_content(path)
+    # Remove file:// prefix
+    while content.startswith("file://"):
+        content = content[len("file://") :]
+    return f'r"{content}"'
-def resolve_path(path: str, is_raw: bool, must_exist: bool) -> str:
+def resolve_path(path: str, must_exist: bool) -> str:
     """Try to resolve a path.
     Parameters
     ----------
     path : str
         The path to resolve.
-    is_raw : bool
-        If the path is a raw string.
     must_exist : bool
         If the path must exist.
     Returns
     -------
-    Path
-        The resolved path.
+    str
+        The resolved path, potentially wrapped in raw string format.
     Raises
     ------
     ValueError
         If the path is not a valid local path.
     """
-    # pylint: disable=broad-except
-    path_string = path
-    if is_raw:
-        path_string = path[2:-1]
+    # Extract the actual path content
+    # if is_raw:
+    path_content = extract_raw_string_content(path)
+    # else:
+    #     path_content = path
+    # Handle JSON-escaped backslashes
+    if "\\\\" in path_content:  # pragma: no cover
+        path_content = path_content.replace("\\\\", "\\")
+    # pylint: disable=too-many-try-statements
     try:
-        resolved = Path(path_string).resolve()
-    except BaseException as error:  # pragma: no cover
-        # check if 'r'... is needed
-        raw_string = f'r"{path}"'
+        # Try to resolve the path
+        resolved = Path(path_content).resolve()
+        if must_exist and not resolved.exists():
+            raise ValueError(f"Path {path} does not exist.")
+        return f'r"{resolved}"'
+    except (
+        OSError,
+        UnicodeDecodeError,
+        ValueError,
+    ) as error:  # pragma: no cover
+        # Fallback: try as raw string for Windows compatibility
+        raw_version = f'r"{path_content}"'
         try:
-            Path(raw_string).resolve()
-        except BaseException:
+            # Test if the path can be resolved when treated as raw
+            resolved = Path(raw_version).resolve()
+            if must_exist and not resolved.exists():
+                raise ValueError(f"Path {path} does not exist.") from error
+            return raw_version
+        except Exception:
             raise ValueError(
-                f"Path {path} is not a valid local path."
+                f"Path {path} is not a valid local path: {error}"
             ) from error
-        return raw_string
-    if not resolved.exists() and must_exist:
-        raise ValueError(f"Path {path} does not exist.")
-    return f'r"{resolved}"'

waldiez 0.4.7__py3-none-any.whl → 0.4.8__py3-none-any.whl

Potentially problematic release.

waldiez 0.4.7__py3-none-any.whl → 0.4.8__py3-none-any.whl