PyPI - lfx-nightly - Versions diffs - 0.2.0.dev26__py3-none-any.whl → 0.2.1.dev7__py3-none-any.whl - Mend

lfx-nightly 0.2.0.dev26__py3-none-any.whl → 0.2.1.dev7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (85) hide show

lfx/_assets/component_index.json +1 -1
lfx/base/agents/agent.py +9 -4
lfx/base/agents/altk_base_agent.py +16 -3
lfx/base/agents/altk_tool_wrappers.py +1 -1
lfx/base/agents/utils.py +4 -0
lfx/base/composio/composio_base.py +78 -41
lfx/base/data/base_file.py +14 -4
lfx/base/data/cloud_storage_utils.py +156 -0
lfx/base/data/docling_utils.py +191 -65
lfx/base/data/storage_utils.py +109 -0
lfx/base/datastax/astradb_base.py +75 -64
lfx/base/mcp/util.py +2 -2
lfx/base/models/__init__.py +11 -1
lfx/base/models/anthropic_constants.py +21 -12
lfx/base/models/google_generative_ai_constants.py +33 -9
lfx/base/models/model_metadata.py +6 -0
lfx/base/models/ollama_constants.py +196 -30
lfx/base/models/openai_constants.py +37 -10
lfx/base/models/unified_models.py +1123 -0
lfx/base/models/watsonx_constants.py +36 -0
lfx/base/tools/component_tool.py +2 -9
lfx/cli/commands.py +6 -1
lfx/cli/run.py +65 -409
lfx/cli/script_loader.py +13 -3
lfx/components/__init__.py +0 -3
lfx/components/composio/github_composio.py +1 -1
lfx/components/cuga/cuga_agent.py +39 -27
lfx/components/data_source/api_request.py +4 -2
lfx/components/docling/__init__.py +45 -11
lfx/components/docling/chunk_docling_document.py +3 -1
lfx/components/docling/docling_inline.py +39 -49
lfx/components/docling/export_docling_document.py +3 -1
lfx/components/elastic/opensearch_multimodal.py +215 -57
lfx/components/files_and_knowledge/file.py +439 -39
lfx/components/files_and_knowledge/ingestion.py +8 -0
lfx/components/files_and_knowledge/retrieval.py +10 -0
lfx/components/files_and_knowledge/save_file.py +123 -53
lfx/components/ibm/watsonx.py +7 -1
lfx/components/input_output/chat_output.py +7 -1
lfx/components/langchain_utilities/tool_calling.py +14 -6
lfx/components/llm_operations/batch_run.py +80 -25
lfx/components/llm_operations/lambda_filter.py +33 -6
lfx/components/llm_operations/llm_conditional_router.py +39 -7
lfx/components/llm_operations/structured_output.py +38 -12
lfx/components/models/__init__.py +16 -74
lfx/components/models_and_agents/agent.py +51 -201
lfx/components/models_and_agents/embedding_model.py +185 -339
lfx/components/models_and_agents/language_model.py +54 -318
lfx/components/models_and_agents/mcp_component.py +58 -9
lfx/components/ollama/ollama.py +9 -4
lfx/components/ollama/ollama_embeddings.py +2 -1
lfx/components/openai/openai_chat_model.py +1 -1
lfx/components/processing/__init__.py +0 -3
lfx/components/vllm/__init__.py +37 -0
lfx/components/vllm/vllm.py +141 -0
lfx/components/vllm/vllm_embeddings.py +110 -0
lfx/custom/custom_component/custom_component.py +8 -6
lfx/custom/directory_reader/directory_reader.py +5 -2
lfx/graph/utils.py +64 -18
lfx/inputs/__init__.py +2 -0
lfx/inputs/input_mixin.py +54 -0
lfx/inputs/inputs.py +115 -0
lfx/interface/initialize/loading.py +42 -12
lfx/io/__init__.py +2 -0
lfx/run/__init__.py +5 -0
lfx/run/base.py +494 -0
lfx/schema/data.py +1 -1
lfx/schema/image.py +28 -19
lfx/schema/message.py +19 -3
lfx/services/interfaces.py +5 -0
lfx/services/manager.py +5 -4
lfx/services/mcp_composer/service.py +45 -13
lfx/services/settings/auth.py +18 -11
lfx/services/settings/base.py +12 -24
lfx/services/settings/constants.py +2 -0
lfx/services/storage/local.py +37 -0
lfx/services/storage/service.py +19 -0
lfx/utils/constants.py +1 -0
lfx/utils/image.py +29 -11
lfx/utils/validate_cloud.py +14 -3
{lfx_nightly-0.2.0.dev26.dist-info → lfx_nightly-0.2.1.dev7.dist-info}/METADATA +5 -2
{lfx_nightly-0.2.0.dev26.dist-info → lfx_nightly-0.2.1.dev7.dist-info}/RECORD +84 -78
lfx/components/processing/dataframe_to_toolset.py +0 -259
{lfx_nightly-0.2.0.dev26.dist-info → lfx_nightly-0.2.1.dev7.dist-info}/WHEEL +0 -0
{lfx_nightly-0.2.0.dev26.dist-info → lfx_nightly-0.2.1.dev7.dist-info}/entry_points.txt +0 -0

lfx/base/agents/agent.py CHANGED Viewed

@@ -71,8 +71,8 @@ class LCAgentComponent(Component):
     ]
     outputs = [
-        Output(display_name="Agent", name="agent", method="build_agent", hidden=True, tool_mode=False),
         Output(display_name="Response", name="response", method="message_response"),
+        Output(display_name="Agent", name="agent", method="build_agent", tool_mode=False),
     ]
     # Get shared callbacks for tracing and save them to self.shared_callbacks
@@ -181,7 +181,11 @@ class LCAgentComponent(Component):
         else:
             input_dict = {"input": self.input_value}
-        if hasattr(self, "system_prompt"):
+        # Ensure input_dict is initialized
+        if "input" not in input_dict:
+            input_dict = {"input": self.input_value}
+        if hasattr(self, "system_prompt") and self.system_prompt and self.system_prompt.strip():
             input_dict["system_prompt"] = self.system_prompt
         if hasattr(self, "chat_history") and self.chat_history:
@@ -196,8 +200,9 @@ class LCAgentComponent(Component):
         # Note: Agent input must be a string, so we extract text and move images to chat_history
         if lc_message is not None and hasattr(lc_message, "content") and isinstance(lc_message.content, list):
             # Extract images and text from the text content items
-            image_dicts = [item for item in lc_message.content if item.get("type") == "image"]
-            text_content = [item for item in lc_message.content if item.get("type") != "image"]
+            # Support both "image" (legacy) and "image_url" (standard) types
+            image_dicts = [item for item in lc_message.content if item.get("type") in ("image", "image_url")]
+            text_content = [item for item in lc_message.content if item.get("type") not in ("image", "image_url")]
             text_strings = [
                 item.get("text", "")

lfx/base/agents/altk_base_agent.py CHANGED Viewed

@@ -319,9 +319,9 @@ class ALTKBaseAgentComponent(AgentComponent):
                 input_dict["chat_history"] = data_to_messages([m.to_data() for m in self.chat_history])
         if hasattr(lc_message, "content") and isinstance(lc_message.content, list):
             # ! Because the input has to be a string, we must pass the images in the chat_history
-            image_dicts = [item for item in lc_message.content if item.get("type") == "image"]
-            lc_message.content = [item for item in lc_message.content if item.get("type") != "image"]
+            # Support both "image" (legacy) and "image_url" (standard) types
+            image_dicts = [item for item in lc_message.content if item.get("type") in ("image", "image_url")]
+            lc_message.content = [item for item in lc_message.content if item.get("type") not in ("image", "image_url")]
             if "chat_history" not in input_dict:
                 input_dict["chat_history"] = []
@@ -330,6 +330,19 @@ class ALTKBaseAgentComponent(AgentComponent):
             else:
                 input_dict["chat_history"] = [HumanMessage(content=[image_dict]) for image_dict in image_dicts]
         input_dict["input"] = input_text
+        # Copied from agent.py
+        # Final safety check: ensure input is never empty (prevents Anthropic API errors)
+        current_input = input_dict.get("input", "")
+        if isinstance(current_input, list):
+            current_input = " ".join(map(str, current_input))
+        elif not isinstance(current_input, str):
+            current_input = str(current_input)
+        if not current_input.strip():
+            input_dict["input"] = "Continue the conversation."
+        else:
+            input_dict["input"] = current_input
         if hasattr(self, "graph"):
             session_id = self.graph.session_id
         elif hasattr(self, "_session_id"):

lfx/base/agents/altk_tool_wrappers.py CHANGED Viewed

@@ -513,7 +513,7 @@ class PostToolProcessor(ALTKBaseTool):
                 output = None
                 try:
                     output = middleware.process(input_data, AgentPhase.RUNTIME)
-                except (AttributeError, TypeError, ValueError, RuntimeError) as e:
+                except Exception as e:  # noqa: BLE001
                     logger.error(f"Exception in executing CodeGenerationComponent: {e}")
                 if output is not None and hasattr(output, "result"):
                     logger.info(f"Output of CodeGenerationComponent: {output.result}")

lfx/base/agents/utils.py CHANGED Viewed

@@ -224,6 +224,10 @@ def get_chat_output_sender_name(self) -> str | None:
     if not hasattr(self, "graph") or not self.graph:
         return None
+    # Check if graph has vertices attribute (PlaceholderGraph doesn't)
+    if not hasattr(self.graph, "vertices"):
+        return None
     for vertex in self.graph.vertices:
         # Safely check if vertex has data attribute, correct type, and raw_params
         if (

lfx/base/composio/composio_base.py CHANGED Viewed

@@ -41,6 +41,58 @@ class ComposioBaseComponent(Component):
     default_tools_limit: int = 5
+    # Reserved attribute names that conflict with Component base class
+    RESERVED_ATTRIBUTES: set[str] = {
+        # Core component attributes
+        "name",
+        "description",
+        "status",
+        "display_name",
+        "icon",
+        "priority",
+        "code",
+        "inputs",
+        "outputs",
+        "selected_output",
+        # Properties and methods
+        "trace_type",
+        "trace_name",
+        "function",
+        "repr_value",
+        "field_config",
+        "field_order",
+        "frozen",
+        "build_parameters",
+        "cache",
+        "tools_metadata",
+        "vertex",
+        # User and session attributes
+        "user_id",  # Already handled separately but included for completeness
+        "session_id",
+        "flow_id",
+        "flow_name",
+        "context",
+        # Common method names
+        "build",
+        "run",
+        "stop",
+        "start",
+        "validate",
+        "get_function",
+        "set_attributes",
+        # Additional common conflicts
+        "id",
+        "type",
+        "value",
+        "metadata",
+        "logs",
+        "results",
+        "artifacts",
+        "parameters",
+        "template",
+        "config",
+    }
     _base_inputs = [
         MessageTextInput(
             name="entity_id",
@@ -623,13 +675,9 @@ class ComposioBaseComponent(Component):
                                 attachment_related_found = True
                                 continue  # Skip individual attachment fields
-                            # Handle conflicting field names - rename user_id to avoid conflicts with entity_id
-                            if clean_field == "user_id":
-                                clean_field = f"{self.app_name}_user_id"
-                            # Handle reserved attribute name conflicts (e.g., 'status', 'name')
+                            # Handle reserved attribute name conflicts
                             # Prefix with app name to prevent clashes with component attributes
-                            if clean_field in {"status", "name"}:
+                            if clean_field in self.RESERVED_ATTRIBUTES:
                                 clean_field = f"{self.app_name}_{clean_field}"
                             action_fields.append(clean_field)
@@ -795,28 +843,16 @@ class ComposioBaseComponent(Component):
                     # Don't add individual attachment sub-fields to the schema
                     continue
-                # Handle conflicting field names - rename user_id to avoid conflicts with entity_id
-                if clean_field_name == "user_id":
-                    clean_field_name = f"{self.app_name}_user_id"
+                # Handle reserved attribute name conflicts
+                if clean_field_name in self.RESERVED_ATTRIBUTES:
+                    original_name = clean_field_name
+                    clean_field_name = f"{self.app_name}_{clean_field_name}"
                     # Update the field schema description to reflect the name change
                     field_schema_copy = field_schema.copy()
+                    original_description = field_schema.get("description", "")
                     field_schema_copy["description"] = (
-                        f"User ID for {self.app_name.title()}: " + field_schema["description"]
-                    )
-                elif clean_field_name == "status":
-                    clean_field_name = f"{self.app_name}_status"
-                    # Update the field schema description to reflect the name change
-                    field_schema_copy = field_schema.copy()
-                    field_schema_copy["description"] = f"Status for {self.app_name.title()}: " + field_schema.get(
-                        "description", ""
-                    )
-                elif clean_field_name == "name":
-                    clean_field_name = f"{self.app_name}_name"
-                    # Update the field schema description to reflect the name change
-                    field_schema_copy = field_schema.copy()
-                    field_schema_copy["description"] = f"Name for {self.app_name.title()}: " + field_schema.get(
-                        "description", ""
-                    )
+                        f"{original_name.replace('_', ' ').title()} for {self.app_name.title()}: {original_description}"
+                    ).strip()
                 else:
                     # Use the original field schema for all other fields
                     field_schema_copy = field_schema
@@ -842,12 +878,8 @@ class ComposioBaseComponent(Component):
                 cleaned_required = []
                 for field in flat_schema["required"]:
                     base = field.replace("[0]", "")
-                    if base == "user_id":
-                        cleaned_required.append(f"{self.app_name}_user_id")
-                    elif base == "status":
-                        cleaned_required.append(f"{self.app_name}_status")
-                    elif base == "name":
-                        cleaned_required.append(f"{self.app_name}_name")
+                    if base in self.RESERVED_ATTRIBUTES:
+                        cleaned_required.append(f"{self.app_name}_{base}")
                     else:
                         cleaned_required.append(base)
                 flat_schema["required"] = cleaned_required
@@ -943,9 +975,10 @@ class ComposioBaseComponent(Component):
                                 inp.advanced = True
                             # Skip entity_id being mapped to user_id parameter
-                            if inp.name == "user_id" and getattr(self, "entity_id", None) == getattr(
-                                inp, "value", None
-                            ):
+                            # Check both original name and renamed version
+                            if inp.name in {"user_id", f"{self.app_name}_user_id"} and getattr(
+                                self, "entity_id", None
+                            ) == getattr(inp, "value", None):
                                 continue
                             processed_inputs.append(inp)
@@ -2422,12 +2455,11 @@ class ComposioBaseComponent(Component):
                 # Handle renamed fields - map back to original names for API execution
                 final_field_name = field
-                if field.endswith("_user_id") and field.startswith(self.app_name):
-                    final_field_name = "user_id"
-                elif field == f"{self.app_name}_status":
-                    final_field_name = "status"
-                elif field == f"{self.app_name}_name":
-                    final_field_name = "name"
+                # Check if this is a renamed reserved attribute
+                if field.startswith(f"{self.app_name}_"):
+                    potential_original = field[len(self.app_name) + 1 :]  # Remove app_name prefix
+                    if potential_original in self.RESERVED_ATTRIBUTES:
+                        final_field_name = potential_original
                 arguments[final_field_name] = value
@@ -2538,7 +2570,7 @@ class ComposioBaseComponent(Component):
                 build_config[fname]["value"] = "" if fname not in self._bool_variables else False
         # Hide any other visible, non-protected fields that look like parameters
         protected = {
-            "code",
+            # Component control fields
             "entity_id",
             "api_key",
             "auth_link",
@@ -2570,6 +2602,11 @@ class ComposioBaseComponent(Component):
             "instance_url",
             "tenant_id",
         }
+        # Add all reserved Component attributes to protected set
+        protected.update(self.RESERVED_ATTRIBUTES)
+        # Also add the renamed versions (with app_name prefix) to protected set
+        for attr in self.RESERVED_ATTRIBUTES:
+            protected.add(f"{self.app_name}_{attr}")
         # Add all dynamic auth fields to protected set
         protected.update(self._auth_dynamic_fields)
         # Also protect any auth fields discovered across all instances

lfx/base/data/base_file.py CHANGED Viewed

@@ -260,8 +260,6 @@ class BaseFileComponent(Component, ABC):
         filename = file_path_obj.name
         settings = get_settings_service().settings
-        # Get file size - use storage service for S3, filesystem for local
         if settings.storage_type == "s3":
             try:
                 file_size = get_file_size(file_path)
@@ -618,9 +616,21 @@ class BaseFileComponent(Component, ABC):
                     BaseFileComponent.BaseFile(data, Path(path_str), delete_after_processing=delete_after_processing)
                 )
             else:
-                resolved_path = Path(self.resolve_path(path_str))
+                # Check if path looks like a storage path (flow_id/filename format)
+                # If so, use get_full_path to resolve it to the actual storage location
+                if "/" in path_str and not Path(path_str).is_absolute():
+                    try:
+                        resolved_path = Path(self.get_full_path(path_str))
+                        self.log(f"Resolved storage path '{path_str}' to '{resolved_path}'")
+                    except (ValueError, AttributeError) as e:
+                        # Fallback to resolve_path if get_full_path fails
+                        self.log(f"get_full_path failed for '{path_str}': {e}, falling back to resolve_path")
+                        resolved_path = Path(self.resolve_path(path_str))
+                else:
+                    resolved_path = Path(self.resolve_path(path_str))
                 if not resolved_path.exists():
-                    msg = f"File or directory not found: {path}"
+                    msg = f"File not found: '{path}' (resolved to: '{resolved_path}'). Please upload the file again."
                     self.log(msg)
                     if not self.silent_errors:
                         raise ValueError(msg)

lfx/base/data/cloud_storage_utils.py ADDED Viewed

@@ -0,0 +1,156 @@
+"""Shared utilities for cloud storage operations (AWS S3 and Google Drive).
+This module provides common functionality used by both read and write file components
+to avoid code duplication.
+"""
+from __future__ import annotations
+import json
+from typing import Any
+def validate_aws_credentials(component: Any) -> None:
+    """Validate that required AWS S3 credentials are present.
+    Args:
+        component: Component instance with AWS credential attributes
+    Raises:
+        ValueError: If any required credential is missing
+    """
+    if not getattr(component, "aws_access_key_id", None):
+        msg = "AWS Access Key ID is required for S3 storage"
+        raise ValueError(msg)
+    if not getattr(component, "aws_secret_access_key", None):
+        msg = "AWS Secret Key is required for S3 storage"
+        raise ValueError(msg)
+    if not getattr(component, "bucket_name", None):
+        msg = "S3 Bucket Name is required for S3 storage"
+        raise ValueError(msg)
+def create_s3_client(component: Any):
+    """Create and return a configured boto3 S3 client.
+    Args:
+        component: Component instance with AWS credential attributes
+    Returns:
+        boto3 S3 client instance
+    Raises:
+        ImportError: If boto3 is not installed
+    """
+    try:
+        import boto3
+    except ImportError as e:
+        msg = "boto3 is not installed. Please install it using `uv pip install boto3`."
+        raise ImportError(msg) from e
+    client_config = {
+        "aws_access_key_id": component.aws_access_key_id,
+        "aws_secret_access_key": component.aws_secret_access_key,
+    }
+    if hasattr(component, "aws_region") and component.aws_region:
+        client_config["region_name"] = component.aws_region
+    return boto3.client("s3", **client_config)
+def parse_google_service_account_key(service_account_key: str) -> dict:
+    """Parse Google service account JSON key with multiple fallback strategies.
+    This function handles various common formatting issues when users paste
+    service account keys, including:
+    - Control characters
+    - Extra whitespace
+    - Double-encoded JSON strings
+    - Escaped newlines in private_key field
+    Args:
+        service_account_key: Service account JSON key as string
+    Returns:
+        dict: Parsed service account credentials
+    Raises:
+        ValueError: If all parsing strategies fail
+    """
+    credentials_dict = None
+    parse_errors = []
+    # Strategy 1: Parse as-is with strict=False to allow control characters
+    try:
+        credentials_dict = json.loads(service_account_key, strict=False)
+    except json.JSONDecodeError as e:
+        parse_errors.append(f"Standard parse: {e!s}")
+    # Strategy 2: Strip whitespace and try again
+    if credentials_dict is None:
+        try:
+            cleaned_key = service_account_key.strip()
+            credentials_dict = json.loads(cleaned_key, strict=False)
+        except json.JSONDecodeError as e:
+            parse_errors.append(f"Stripped parse: {e!s}")
+    # Strategy 3: Check if it's double-encoded (JSON string of a JSON string)
+    if credentials_dict is None:
+        try:
+            decoded_once = json.loads(service_account_key, strict=False)
+            credentials_dict = json.loads(decoded_once, strict=False) if isinstance(decoded_once, str) else decoded_once
+        except json.JSONDecodeError as e:
+            parse_errors.append(f"Double-encoded parse: {e!s}")
+    # Strategy 4: Try to fix common issues with newlines in the private_key field
+    if credentials_dict is None:
+        try:
+            # Replace literal \n with actual newlines which is common in pasted JSON
+            fixed_key = service_account_key.replace("\\n", "\n")
+            credentials_dict = json.loads(fixed_key, strict=False)
+        except json.JSONDecodeError as e:
+            parse_errors.append(f"Newline-fixed parse: {e!s}")
+    if credentials_dict is None:
+        error_details = "; ".join(parse_errors)
+        msg = (
+            f"Unable to parse service account key JSON. Tried multiple strategies: {error_details}. "
+            "Please ensure you've copied the entire JSON content from your service account key file. "
+            "The JSON should start with '{' and contain fields like 'type', 'project_id', 'private_key', etc."
+        )
+        raise ValueError(msg)
+    return credentials_dict
+def create_google_drive_service(service_account_key: str, scopes: list[str], *, return_credentials: bool = False):
+    """Create and return a configured Google Drive API service.
+    Args:
+        service_account_key: Service account JSON key as string
+        scopes: List of Google API scopes to request
+        return_credentials: If True, return both service and credentials as tuple
+    Returns:
+        Google Drive API service instance, or tuple of (service, credentials) if return_credentials=True
+    Raises:
+        ImportError: If Google API client libraries are not installed
+        ValueError: If credentials cannot be parsed
+    """
+    try:
+        from google.oauth2 import service_account
+        from googleapiclient.discovery import build
+    except ImportError as e:
+        msg = "Google API client libraries are not installed. Please install them."
+        raise ImportError(msg) from e
+    credentials_dict = parse_google_service_account_key(service_account_key)
+    credentials = service_account.Credentials.from_service_account_info(credentials_dict, scopes=scopes)
+    service = build("drive", "v3", credentials=credentials)
+    if return_credentials:
+        return service, credentials
+    return service

lfx-nightly 0.2.0.dev26__py3-none-any.whl → 0.2.1.dev7__py3-none-any.whl

lfx-nightly 0.2.0.dev26__py3-none-any.whl → 0.2.1.dev7__py3-none-any.whl