lfx-nightly 0.2.0.dev0__py3-none-any.whl → 0.2.0.dev41__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (196)
  1. lfx/_assets/component_index.json +1 -1
  2. lfx/base/agents/agent.py +21 -4
  3. lfx/base/agents/altk_base_agent.py +393 -0
  4. lfx/base/agents/altk_tool_wrappers.py +565 -0
  5. lfx/base/agents/events.py +2 -1
  6. lfx/base/composio/composio_base.py +159 -224
  7. lfx/base/data/base_file.py +97 -20
  8. lfx/base/data/docling_utils.py +61 -10
  9. lfx/base/data/storage_utils.py +301 -0
  10. lfx/base/data/utils.py +178 -14
  11. lfx/base/mcp/util.py +2 -2
  12. lfx/base/models/anthropic_constants.py +21 -12
  13. lfx/base/models/groq_constants.py +74 -58
  14. lfx/base/models/groq_model_discovery.py +265 -0
  15. lfx/base/models/model.py +1 -1
  16. lfx/base/models/model_utils.py +100 -0
  17. lfx/base/models/openai_constants.py +7 -0
  18. lfx/base/models/watsonx_constants.py +32 -8
  19. lfx/base/tools/run_flow.py +601 -129
  20. lfx/cli/commands.py +9 -4
  21. lfx/cli/common.py +2 -2
  22. lfx/cli/run.py +1 -1
  23. lfx/cli/script_loader.py +53 -11
  24. lfx/components/Notion/create_page.py +1 -1
  25. lfx/components/Notion/list_database_properties.py +1 -1
  26. lfx/components/Notion/list_pages.py +1 -1
  27. lfx/components/Notion/list_users.py +1 -1
  28. lfx/components/Notion/page_content_viewer.py +1 -1
  29. lfx/components/Notion/search.py +1 -1
  30. lfx/components/Notion/update_page_property.py +1 -1
  31. lfx/components/__init__.py +19 -5
  32. lfx/components/{agents → altk}/__init__.py +5 -9
  33. lfx/components/altk/altk_agent.py +193 -0
  34. lfx/components/apify/apify_actor.py +1 -1
  35. lfx/components/composio/__init__.py +70 -18
  36. lfx/components/composio/apollo_composio.py +11 -0
  37. lfx/components/composio/bitbucket_composio.py +11 -0
  38. lfx/components/composio/canva_composio.py +11 -0
  39. lfx/components/composio/coda_composio.py +11 -0
  40. lfx/components/composio/composio_api.py +10 -0
  41. lfx/components/composio/discord_composio.py +1 -1
  42. lfx/components/composio/elevenlabs_composio.py +11 -0
  43. lfx/components/composio/exa_composio.py +11 -0
  44. lfx/components/composio/firecrawl_composio.py +11 -0
  45. lfx/components/composio/fireflies_composio.py +11 -0
  46. lfx/components/composio/gmail_composio.py +1 -1
  47. lfx/components/composio/googlebigquery_composio.py +11 -0
  48. lfx/components/composio/googlecalendar_composio.py +1 -1
  49. lfx/components/composio/googledocs_composio.py +1 -1
  50. lfx/components/composio/googlemeet_composio.py +1 -1
  51. lfx/components/composio/googlesheets_composio.py +1 -1
  52. lfx/components/composio/googletasks_composio.py +1 -1
  53. lfx/components/composio/heygen_composio.py +11 -0
  54. lfx/components/composio/mem0_composio.py +11 -0
  55. lfx/components/composio/peopledatalabs_composio.py +11 -0
  56. lfx/components/composio/perplexityai_composio.py +11 -0
  57. lfx/components/composio/serpapi_composio.py +11 -0
  58. lfx/components/composio/slack_composio.py +3 -574
  59. lfx/components/composio/slackbot_composio.py +1 -1
  60. lfx/components/composio/snowflake_composio.py +11 -0
  61. lfx/components/composio/tavily_composio.py +11 -0
  62. lfx/components/composio/youtube_composio.py +2 -2
  63. lfx/components/cuga/__init__.py +34 -0
  64. lfx/components/cuga/cuga_agent.py +730 -0
  65. lfx/components/data/__init__.py +78 -28
  66. lfx/components/data_source/__init__.py +58 -0
  67. lfx/components/{data → data_source}/api_request.py +26 -3
  68. lfx/components/{data → data_source}/csv_to_data.py +15 -10
  69. lfx/components/{data → data_source}/json_to_data.py +15 -8
  70. lfx/components/{data → data_source}/news_search.py +1 -1
  71. lfx/components/{data → data_source}/rss.py +1 -1
  72. lfx/components/{data → data_source}/sql_executor.py +1 -1
  73. lfx/components/{data → data_source}/url.py +1 -1
  74. lfx/components/{data → data_source}/web_search.py +1 -1
  75. lfx/components/datastax/astradb_cql.py +1 -1
  76. lfx/components/datastax/astradb_graph.py +1 -1
  77. lfx/components/datastax/astradb_tool.py +1 -1
  78. lfx/components/datastax/astradb_vectorstore.py +1 -1
  79. lfx/components/datastax/hcd.py +1 -1
  80. lfx/components/deactivated/json_document_builder.py +1 -1
  81. lfx/components/docling/__init__.py +0 -3
  82. lfx/components/docling/chunk_docling_document.py +3 -1
  83. lfx/components/docling/export_docling_document.py +3 -1
  84. lfx/components/elastic/elasticsearch.py +1 -1
  85. lfx/components/files_and_knowledge/__init__.py +47 -0
  86. lfx/components/{data → files_and_knowledge}/directory.py +1 -1
  87. lfx/components/{data → files_and_knowledge}/file.py +304 -24
  88. lfx/components/{knowledge_bases → files_and_knowledge}/retrieval.py +2 -2
  89. lfx/components/{data → files_and_knowledge}/save_file.py +218 -31
  90. lfx/components/flow_controls/__init__.py +58 -0
  91. lfx/components/{logic → flow_controls}/conditional_router.py +1 -1
  92. lfx/components/{logic → flow_controls}/loop.py +43 -9
  93. lfx/components/flow_controls/run_flow.py +108 -0
  94. lfx/components/glean/glean_search_api.py +1 -1
  95. lfx/components/groq/groq.py +35 -28
  96. lfx/components/helpers/__init__.py +102 -0
  97. lfx/components/ibm/watsonx.py +7 -1
  98. lfx/components/input_output/__init__.py +3 -1
  99. lfx/components/input_output/chat.py +4 -3
  100. lfx/components/input_output/chat_output.py +10 -4
  101. lfx/components/input_output/text.py +1 -1
  102. lfx/components/input_output/text_output.py +1 -1
  103. lfx/components/{data → input_output}/webhook.py +1 -1
  104. lfx/components/knowledge_bases/__init__.py +59 -4
  105. lfx/components/langchain_utilities/character.py +1 -1
  106. lfx/components/langchain_utilities/csv_agent.py +84 -16
  107. lfx/components/langchain_utilities/json_agent.py +67 -12
  108. lfx/components/langchain_utilities/language_recursive.py +1 -1
  109. lfx/components/llm_operations/__init__.py +46 -0
  110. lfx/components/{processing → llm_operations}/batch_run.py +17 -8
  111. lfx/components/{processing → llm_operations}/lambda_filter.py +1 -1
  112. lfx/components/{logic → llm_operations}/llm_conditional_router.py +1 -1
  113. lfx/components/{processing/llm_router.py → llm_operations/llm_selector.py} +3 -3
  114. lfx/components/{processing → llm_operations}/structured_output.py +1 -1
  115. lfx/components/logic/__init__.py +126 -0
  116. lfx/components/mem0/mem0_chat_memory.py +11 -0
  117. lfx/components/models/__init__.py +64 -9
  118. lfx/components/models_and_agents/__init__.py +49 -0
  119. lfx/components/{agents → models_and_agents}/agent.py +6 -4
  120. lfx/components/models_and_agents/embedding_model.py +353 -0
  121. lfx/components/models_and_agents/language_model.py +398 -0
  122. lfx/components/{agents → models_and_agents}/mcp_component.py +53 -44
  123. lfx/components/{helpers → models_and_agents}/memory.py +1 -1
  124. lfx/components/nvidia/system_assist.py +1 -1
  125. lfx/components/olivya/olivya.py +1 -1
  126. lfx/components/ollama/ollama.py +24 -5
  127. lfx/components/processing/__init__.py +9 -60
  128. lfx/components/processing/converter.py +1 -1
  129. lfx/components/processing/dataframe_operations.py +1 -1
  130. lfx/components/processing/parse_json_data.py +2 -2
  131. lfx/components/processing/parser.py +1 -1
  132. lfx/components/processing/split_text.py +1 -1
  133. lfx/components/qdrant/qdrant.py +1 -1
  134. lfx/components/redis/redis.py +1 -1
  135. lfx/components/twelvelabs/split_video.py +10 -0
  136. lfx/components/twelvelabs/video_file.py +12 -0
  137. lfx/components/utilities/__init__.py +43 -0
  138. lfx/components/{helpers → utilities}/calculator_core.py +1 -1
  139. lfx/components/{helpers → utilities}/current_date.py +1 -1
  140. lfx/components/{processing → utilities}/python_repl_core.py +1 -1
  141. lfx/components/vectorstores/local_db.py +9 -0
  142. lfx/components/youtube/youtube_transcripts.py +118 -30
  143. lfx/custom/custom_component/component.py +57 -1
  144. lfx/custom/custom_component/custom_component.py +68 -6
  145. lfx/custom/directory_reader/directory_reader.py +5 -2
  146. lfx/graph/edge/base.py +43 -20
  147. lfx/graph/state/model.py +15 -2
  148. lfx/graph/utils.py +6 -0
  149. lfx/graph/vertex/param_handler.py +10 -7
  150. lfx/helpers/__init__.py +12 -0
  151. lfx/helpers/flow.py +117 -0
  152. lfx/inputs/input_mixin.py +24 -1
  153. lfx/inputs/inputs.py +13 -1
  154. lfx/interface/components.py +161 -83
  155. lfx/log/logger.py +5 -3
  156. lfx/schema/image.py +2 -12
  157. lfx/services/database/__init__.py +5 -0
  158. lfx/services/database/service.py +25 -0
  159. lfx/services/deps.py +87 -22
  160. lfx/services/interfaces.py +5 -0
  161. lfx/services/manager.py +24 -10
  162. lfx/services/mcp_composer/service.py +1029 -162
  163. lfx/services/session.py +5 -0
  164. lfx/services/settings/auth.py +18 -11
  165. lfx/services/settings/base.py +56 -30
  166. lfx/services/settings/constants.py +8 -0
  167. lfx/services/storage/local.py +108 -46
  168. lfx/services/storage/service.py +171 -29
  169. lfx/template/field/base.py +3 -0
  170. lfx/utils/image.py +29 -11
  171. lfx/utils/ssrf_protection.py +384 -0
  172. lfx/utils/validate_cloud.py +26 -0
  173. {lfx_nightly-0.2.0.dev0.dist-info → lfx_nightly-0.2.0.dev41.dist-info}/METADATA +38 -22
  174. {lfx_nightly-0.2.0.dev0.dist-info → lfx_nightly-0.2.0.dev41.dist-info}/RECORD +189 -160
  175. {lfx_nightly-0.2.0.dev0.dist-info → lfx_nightly-0.2.0.dev41.dist-info}/WHEEL +1 -1
  176. lfx/components/agents/altk_agent.py +0 -366
  177. lfx/components/agents/cuga_agent.py +0 -1013
  178. lfx/components/docling/docling_remote_vlm.py +0 -284
  179. lfx/components/logic/run_flow.py +0 -71
  180. lfx/components/models/embedding_model.py +0 -195
  181. lfx/components/models/language_model.py +0 -144
  182. lfx/components/processing/dataframe_to_toolset.py +0 -259
  183. /lfx/components/{data → data_source}/mock_data.py +0 -0
  184. /lfx/components/{knowledge_bases → files_and_knowledge}/ingestion.py +0 -0
  185. /lfx/components/{logic → flow_controls}/data_conditional_router.py +0 -0
  186. /lfx/components/{logic → flow_controls}/flow_tool.py +0 -0
  187. /lfx/components/{logic → flow_controls}/listen.py +0 -0
  188. /lfx/components/{logic → flow_controls}/notify.py +0 -0
  189. /lfx/components/{logic → flow_controls}/pass_message.py +0 -0
  190. /lfx/components/{logic → flow_controls}/sub_flow.py +0 -0
  191. /lfx/components/{processing → models_and_agents}/prompt.py +0 -0
  192. /lfx/components/{helpers → processing}/create_list.py +0 -0
  193. /lfx/components/{helpers → processing}/output_parser.py +0 -0
  194. /lfx/components/{helpers → processing}/store_message.py +0 -0
  195. /lfx/components/{helpers → utilities}/id_generator.py +0 -0
  196. {lfx_nightly-0.2.0.dev0.dist-info → lfx_nightly-0.2.0.dev41.dist-info}/entry_points.txt +0 -0
lfx/components/ollama/ollama.py
@@ -101,6 +101,7 @@ class ChatOllamaComponent(LCModelComponent):
             info="Refer to https://ollama.com/library for more models.",
             refresh_button=True,
             real_time_refresh=True,
+            required=True,
         ),
         SecretStrInput(
             name="api_key",
@@ -122,9 +123,9 @@ class ChatOllamaComponent(LCModelComponent):
             name="format",
             display_name="Format",
             info="Specify the format of the output.",
-            advanced=False,
             table_schema=TABLE_SCHEMA,
             value=default_table_row,
+            show=False,
         ),
         DictInput(name="metadata", display_name="Metadata", info="Metadata to add to the run trace.", advanced=True),
         DropdownInput(
@@ -215,6 +216,14 @@ class ChatOllamaComponent(LCModelComponent):
         MessageTextInput(
             name="template", display_name="Template", info="Template to use for generating text.", advanced=True
         ),
+        BoolInput(
+            name="enable_structured_output",
+            display_name="Enable Structured Output",
+            info="Whether to enable structured output in the model.",
+            value=False,
+            advanced=False,
+            real_time_refresh=True,
+        ),
         *LCModelComponent.get_base_inputs(),
     ]

@@ -254,7 +263,7 @@ class ChatOllamaComponent(LCModelComponent):
         )

         try:
-            output_format = self._parse_format_field(self.format)
+            output_format = self._parse_format_field(self.format) if self.enable_structured_output else None
         except Exception as e:
             msg = f"Failed to parse the format field: {e}"
             raise ValueError(msg) from e
@@ -264,7 +273,7 @@ class ChatOllamaComponent(LCModelComponent):
             "base_url": transformed_base_url,
             "model": self.model_name,
             "mirostat": mirostat_value,
-            "format": output_format,
+            "format": output_format or None,
             "metadata": self.metadata,
             "tags": self.tags.split(",") if self.tags else None,
             "mirostat_eta": mirostat_eta,
@@ -319,6 +328,9 @@ class ChatOllamaComponent(LCModelComponent):
             return False

     async def update_build_config(self, build_config: dict, field_value: Any, field_name: str | None = None):
+        if field_name == "enable_structured_output":  # bind enable_structured_output boolean to format show value
+            build_config["format"]["show"] = field_value
+
         if field_name == "mirostat":
             if field_value == "Disabled":
                 build_config["mirostat_eta"]["advanced"] = True
@@ -338,10 +350,17 @@ class ChatOllamaComponent(LCModelComponent):
                 build_config["mirostat_tau"]["value"] = 5

         if field_name in {"model_name", "base_url", "tool_model_enabled"}:
-            if await self.is_valid_ollama_url(self.base_url):
+            # Use field_value if base_url is being updated, otherwise use self.base_url
+            base_url_to_check = field_value if field_name == "base_url" else self.base_url
+            # Fallback to self.base_url if field_value is None or empty
+            if not base_url_to_check and field_name == "base_url":
+                base_url_to_check = self.base_url
+            logger.warning(f"Fetching Ollama models from updated URL: {base_url_to_check}")
+
+            if base_url_to_check and await self.is_valid_ollama_url(base_url_to_check):
                 tool_model_enabled = build_config["tool_model_enabled"].get("value", False) or self.tool_model_enabled
                 build_config["model_name"]["options"] = await self.get_models(
-                    self.base_url, tool_model_enabled=tool_model_enabled
+                    base_url_to_check, tool_model_enabled=tool_model_enabled
                 )
             else:
                 build_config["model_name"]["options"] = []
lfx/components/processing/__init__.py
@@ -7,98 +7,47 @@ from typing import TYPE_CHECKING, Any
 from lfx.components._importing import import_mod

 if TYPE_CHECKING:
-    from lfx.components.processing.alter_metadata import AlterMetadataComponent
-    from lfx.components.processing.batch_run import BatchRunComponent
     from lfx.components.processing.combine_text import CombineTextComponent
     from lfx.components.processing.converter import TypeConverterComponent
-    from lfx.components.processing.create_data import CreateDataComponent
+    from lfx.components.processing.create_list import CreateListComponent
     from lfx.components.processing.data_operations import DataOperationsComponent
-    from lfx.components.processing.data_to_dataframe import DataToDataFrameComponent
     from lfx.components.processing.dataframe_operations import DataFrameOperationsComponent
-    from lfx.components.processing.dataframe_to_toolset import DataFrameToToolsetComponent
-    from lfx.components.processing.dynamic_create_data import DynamicCreateDataComponent
-    from lfx.components.processing.extract_key import ExtractDataKeyComponent
-    from lfx.components.processing.filter_data import FilterDataComponent
-    from lfx.components.processing.filter_data_values import DataFilterComponent
     from lfx.components.processing.json_cleaner import JSONCleaner
-    from lfx.components.processing.lambda_filter import LambdaFilterComponent
-    from lfx.components.processing.llm_router import LLMRouterComponent
-    from lfx.components.processing.merge_data import MergeDataComponent
-    from lfx.components.processing.message_to_data import MessageToDataComponent
+    from lfx.components.processing.output_parser import OutputParserComponent
     from lfx.components.processing.parse_data import ParseDataComponent
-    from lfx.components.processing.parse_dataframe import ParseDataFrameComponent
-    from lfx.components.processing.parse_json_data import ParseJSONDataComponent
     from lfx.components.processing.parser import ParserComponent
-    from lfx.components.processing.prompt import PromptComponent
-    from lfx.components.processing.python_repl_core import PythonREPLComponent
     from lfx.components.processing.regex import RegexExtractorComponent
-    from lfx.components.processing.select_data import SelectDataComponent
     from lfx.components.processing.split_text import SplitTextComponent
-    from lfx.components.processing.structured_output import StructuredOutputComponent
-    from lfx.components.processing.update_data import UpdateDataComponent
+    from lfx.components.processing.store_message import MessageStoreComponent

 _dynamic_imports = {
-    "AlterMetadataComponent": "alter_metadata",
-    "BatchRunComponent": "batch_run",
     "CombineTextComponent": "combine_text",
     "TypeConverterComponent": "converter",
-    "CreateDataComponent": "create_data",
+    "CreateListComponent": "create_list",
     "DataOperationsComponent": "data_operations",
-    "DataToDataFrameComponent": "data_to_dataframe",
     "DataFrameOperationsComponent": "dataframe_operations",
-    "DataFrameToToolsetComponent": "dataframe_to_toolset",
-    "DynamicCreateDataComponent": "dynamic_create_data",
-    "ExtractDataKeyComponent": "extract_key",
-    "FilterDataComponent": "filter_data",
-    "DataFilterComponent": "filter_data_values",
     "JSONCleaner": "json_cleaner",
-    "LambdaFilterComponent": "lambda_filter",
-    "LLMRouterComponent": "llm_router",
-    "MergeDataComponent": "merge_data",
-    "MessageToDataComponent": "message_to_data",
+    "OutputParserComponent": "output_parser",
     "ParseDataComponent": "parse_data",
-    "ParseDataFrameComponent": "parse_dataframe",
-    "ParseJSONDataComponent": "parse_json_data",
     "ParserComponent": "parser",
-    "PromptComponent": "prompt",
-    "PythonREPLComponent": "python_repl_core",
     "RegexExtractorComponent": "regex",
-    "SelectDataComponent": "select_data",
     "SplitTextComponent": "split_text",
-    "StructuredOutputComponent": "structured_output",
-    "UpdateDataComponent": "update_data",
+    "MessageStoreComponent": "store_message",
 }

 __all__ = [
-    "AlterMetadataComponent",
-    "BatchRunComponent",
     "CombineTextComponent",
-    "CreateDataComponent",
-    "DataFilterComponent",
+    "CreateListComponent",
     "DataFrameOperationsComponent",
-    "DataFrameToToolsetComponent",
     "DataOperationsComponent",
-    "DataToDataFrameComponent",
-    "DynamicCreateDataComponent",
-    "ExtractDataKeyComponent",
-    "FilterDataComponent",
     "JSONCleaner",
-    "LLMRouterComponent",
-    "LambdaFilterComponent",
-    "MergeDataComponent",
-    "MessageToDataComponent",
+    "MessageStoreComponent",
+    "OutputParserComponent",
     "ParseDataComponent",
-    "ParseDataFrameComponent",
-    "ParseJSONDataComponent",
     "ParserComponent",
-    "PromptComponent",
-    "PythonREPLComponent",
     "RegexExtractorComponent",
-    "SelectDataComponent",
     "SplitTextComponent",
-    "StructuredOutputComponent",
     "TypeConverterComponent",
-    "UpdateDataComponent",
 ]
lfx/components/processing/converter.py
@@ -140,7 +140,7 @@ def _parse_csv_to_data(text: str) -> Data:
 class TypeConverterComponent(Component):
     display_name = "Type Convert"
     description = "Convert between different types (Message, Data, DataFrame)"
-    documentation: str = "https://docs.langflow.org/components-processing#type-convert"
+    documentation: str = "https://docs.langflow.org/type-convert"
     icon = "repeat"

     inputs = [
lfx/components/processing/dataframe_operations.py
@@ -10,7 +10,7 @@ from lfx.schema.dataframe import DataFrame
 class DataFrameOperationsComponent(Component):
     display_name = "DataFrame Operations"
     description = "Perform various operations on a DataFrame."
-    documentation: str = "https://docs.langflow.org/components-processing#dataframe-operations"
+    documentation: str = "https://docs.langflow.org/dataframe-operations"
     icon = "table"
     name = "DataFrameOperations"
lfx/components/processing/parse_json_data.py
@@ -84,8 +84,8 @@ class ParseJSONDataComponent(Component):

         full_filter_str = json.dumps(to_filter_as_dict)

-        logger.info("to_filter: ", to_filter)
+        logger.info("to_filter: %s", to_filter)

         results = jq.compile(self.query).input_text(full_filter_str).all()
-        logger.info("results: ", results)
+        logger.info("results: %s", results)
         return [Data(data=value) if isinstance(value, dict) else Data(text=str(value)) for value in results]
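
The two-line parse_json_data.py fix is more than cosmetic: with %-style loggers, arguments after the message are treated as format args, so `logger.info("to_filter: ", to_filter)` never interpolates the value and triggers a string-formatting error when the record is emitted. A stdlib demonstration of the difference (assuming lfx's logger is %-style compatible, as the fix implies):

    import logging

    logging.basicConfig(level=logging.INFO)
    log = logging.getLogger("demo")

    to_filter = {"a": 1}
    # Broken: no %s placeholder, so the argument is never interpolated and the
    # logging machinery reports a formatting error at emit time instead of the value.
    log.info("to_filter: ", to_filter)
    # Fixed: lazy %-style interpolation, evaluated only if the record is emitted.
    log.info("to_filter: %s", to_filter)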
lfx/components/processing/parser.py
@@ -10,7 +10,7 @@ from lfx.template.field.base import Output
 class ParserComponent(Component):
     display_name = "Parser"
     description = "Extracts text using a template."
-    documentation: str = "https://docs.langflow.org/components-processing#parser"
+    documentation: str = "https://docs.langflow.org/parser"
     icon = "braces"

     inputs = [
lfx/components/processing/split_text.py
@@ -11,7 +11,7 @@ from lfx.utils.util import unescape_string
 class SplitTextComponent(Component):
     display_name: str = "Split Text"
     description: str = "Split text into chunks based on specified criteria."
-    documentation: str = "https://docs.langflow.org/components-processing#split-text"
+    documentation: str = "https://docs.langflow.org/split-text"
     icon = "scissors-line-dashed"
     name = "SplitText"
lfx/components/qdrant/qdrant.py
@@ -1,5 +1,5 @@
-from langchain.embeddings.base import Embeddings
 from langchain_community.vectorstores import Qdrant
+from langchain_core.embeddings import Embeddings

 from lfx.base.vectorstores.model import LCVectorStoreComponent, check_cached_vector_store
 from lfx.helpers.data import docs_to_data
lfx/components/redis/redis.py
@@ -1,7 +1,7 @@
 from pathlib import Path

-from langchain.text_splitter import CharacterTextSplitter
 from langchain_community.vectorstores.redis import Redis
+from langchain_text_splitters import CharacterTextSplitter

 from lfx.base.vectorstores.model import LCVectorStoreComponent, check_cached_vector_store
 from lfx.helpers.data import docs_to_data
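
Both vector-store hunks swap imports from the old langchain.* shim modules to the packages where these classes now live: langchain_core for the Embeddings interface, langchain_text_splitters for CharacterTextSplitter. A quick sanity check of the new paths, assuming recent langchain-core and langchain-text-splitters releases are installed:

    from langchain_core.embeddings import Embeddings
    from langchain_text_splitters import CharacterTextSplitter

    # CharacterTextSplitter splits on a separator ("\n\n" by default),
    # then merges pieces back together up to chunk_size characters.
    splitter = CharacterTextSplitter(separator=" ", chunk_size=10, chunk_overlap=0)
    print(splitter.split_text("one two three four five"))
    # e.g. ['one two', 'three four', 'five']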
lfx/components/twelvelabs/split_video.py
@@ -9,6 +9,13 @@ from lfx.custom import Component
 from lfx.inputs import BoolInput, DropdownInput, HandleInput, IntInput
 from lfx.schema import Data
 from lfx.template import Output
+from lfx.utils.validate_cloud import raise_error_if_astra_cloud_disable_component
+
+disable_component_in_astra_cloud_msg = (
+    "Video processing is not supported in Astra cloud environment. "
+    "Video components require local file system access for processing. "
+    "Please use local storage mode or process videos locally before uploading."
+)


 class SplitVideoComponent(Component):
@@ -267,6 +274,9 @@ class SplitVideoComponent(Component):

     def process(self) -> list[Data]:
         """Process the input video and return a list of Data objects containing the clips."""
+        # Check if we're in Astra cloud environment and raise an error if we are.
+        raise_error_if_astra_cloud_disable_component(disable_component_in_astra_cloud_msg)
+
         try:
             # Get the input video path from the previous component
             if not hasattr(self, "videodata") or not isinstance(self.videodata, list) or len(self.videodata) != 1:
lfx/components/twelvelabs/video_file.py
@@ -3,6 +3,13 @@ from pathlib import Path
 from lfx.base.data import BaseFileComponent
 from lfx.io import FileInput
 from lfx.schema import Data, DataFrame
+from lfx.utils.validate_cloud import raise_error_if_astra_cloud_disable_component
+
+disable_component_in_astra_cloud_msg = (
+    "Video processing is not supported in Astra cloud environment. "
+    "Video components require local file system access for processing. "
+    "Please use local storage mode or process videos locally before uploading."
+)


 class VideoFileComponent(BaseFileComponent):
@@ -97,6 +104,8 @@ class VideoFileComponent(BaseFileComponent):

     def process_files(self, file_list: list[BaseFileComponent.BaseFile]) -> list[BaseFileComponent.BaseFile]:
         """Process video files."""
+        # Check if we're in Astra cloud environment and raise an error if we are.
+        raise_error_if_astra_cloud_disable_component(disable_component_in_astra_cloud_msg)
         self.log(f"DEBUG: Processing video files: {len(file_list)}")

         if not file_list:
@@ -137,6 +146,9 @@ class VideoFileComponent(BaseFileComponent):

     def load_files(self) -> DataFrame:
         """Load video files and return a list of Data objects."""
+        # Check if we're in Astra cloud environment and raise an error if we are.
+        raise_error_if_astra_cloud_disable_component(disable_component_in_astra_cloud_msg)
+
         try:
             self.log("DEBUG: Starting video file load")
             if not hasattr(self, "file_path") or not self.file_path:
lfx/components/utilities/__init__.py
@@ -0,0 +1,43 @@
+from __future__ import annotations
+
+from typing import TYPE_CHECKING, Any
+
+from lfx.components._importing import import_mod
+
+if TYPE_CHECKING:
+    from lfx.components.utilities.calculator_core import CalculatorComponent
+    from lfx.components.utilities.current_date import CurrentDateComponent
+    from lfx.components.utilities.id_generator import IDGeneratorComponent
+    from lfx.components.utilities.python_repl_core import PythonREPLComponent
+
+_dynamic_imports = {
+    "CalculatorComponent": "calculator_core",
+    "CurrentDateComponent": "current_date",
+    "IDGeneratorComponent": "id_generator",
+    "PythonREPLComponent": "python_repl_core",
+}
+
+__all__ = [
+    "CalculatorComponent",
+    "CurrentDateComponent",
+    "IDGeneratorComponent",
+    "PythonREPLComponent",
+]
+
+
+def __getattr__(attr_name: str) -> Any:
+    """Lazily import utility components on attribute access."""
+    if attr_name not in _dynamic_imports:
+        msg = f"module '{__name__}' has no attribute '{attr_name}'"
+        raise AttributeError(msg)
+    try:
+        result = import_mod(attr_name, _dynamic_imports[attr_name], __spec__.parent)
+    except (ModuleNotFoundError, ImportError, AttributeError) as e:
+        msg = f"Could not import '{attr_name}' from '{__name__}': {e}"
+        raise AttributeError(msg) from e
+    globals()[attr_name] = result
+    return result
+
+
+def __dir__() -> list[str]:
+    return list(__all__)
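
The new utilities/__init__.py follows the package's lazy-import convention: PEP 562's module-level __getattr__ defers importing each component module until the name is first accessed, then caches the result in globals() so the hook runs once per name. A self-contained illustration of the same mechanism, using importlib instead of lfx's import_mod helper:

    # demo_pkg/__init__.py - standalone illustration of the lazy-import pattern
    from importlib import import_module
    from typing import Any

    _dynamic_imports = {"sqrt": "math"}  # attribute name -> module that provides it

    def __getattr__(attr_name: str) -> Any:
        if attr_name not in _dynamic_imports:
            msg = f"module '{__name__}' has no attribute '{attr_name}'"
            raise AttributeError(msg)
        result = getattr(import_module(_dynamic_imports[attr_name]), attr_name)
        globals()[attr_name] = result  # cache so __getattr__ runs once per name
        return result

With this in place, `import demo_pkg; demo_pkg.sqrt(4.0)` only imports math on first access; the TYPE_CHECKING block and __dir__ override in the real file keep type checkers and tab completion aware of the lazy names.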
lfx/components/utilities/calculator_core.py
@@ -11,7 +11,7 @@ from lfx.schema.data import Data
 class CalculatorComponent(Component):
     display_name = "Calculator"
     description = "Perform basic arithmetic operations on a given expression."
-    documentation: str = "https://docs.langflow.org/components-helpers#calculator"
+    documentation: str = "https://docs.langflow.org/calculator"
     icon = "calculator"

     # Cache operators dictionary as a class variable
lfx/components/utilities/current_date.py
@@ -10,7 +10,7 @@ from lfx.schema.message import Message
 class CurrentDateComponent(Component):
     display_name = "Current Date"
     description = "Returns the current date and time in the selected timezone."
-    documentation: str = "https://docs.langflow.org/components-helpers#current-date"
+    documentation: str = "https://docs.langflow.org/current-date"
     icon = "clock"
     name = "CurrentDate"
lfx/components/utilities/python_repl_core.py
@@ -10,7 +10,7 @@ from lfx.schema.data import Data
 class PythonREPLComponent(Component):
     display_name = "Python Interpreter"
     description = "Run Python code with optional imports. Use print() to see the output."
-    documentation: str = "https://docs.langflow.org/components-processing#python-interpreter"
+    documentation: str = "https://docs.langflow.org/python-interpreter"
     icon = "square-terminal"

     inputs = [
lfx/components/vectorstores/local_db.py
@@ -12,6 +12,13 @@ from lfx.log.logger import logger
 from lfx.schema.data import Data
 from lfx.schema.dataframe import DataFrame
 from lfx.template.field.base import Output
+from lfx.utils.validate_cloud import raise_error_if_astra_cloud_disable_component
+
+disable_component_in_astra_cloud_msg = (
+    "Local vector stores are not supported in S3/cloud mode. "
+    "Local vector stores require local file system access for persistence. "
+    "Please use cloud-based vector stores (Pinecone, Weaviate, etc.) or local storage mode."
+)


 class LocalDBComponent(LCVectorStoreComponent):
@@ -193,6 +200,8 @@ class LocalDBComponent(LCVectorStoreComponent):
     @check_cached_vector_store
     def build_vector_store(self) -> Chroma:
         """Builds the Chroma object."""
+        raise_error_if_astra_cloud_disable_component(disable_component_in_astra_cloud_msg)
+
         try:
             from langchain_chroma import Chroma
         except ImportError as e:
lfx/components/youtube/youtube_transcripts.py
@@ -1,7 +1,7 @@
+import re
+
 import pandas as pd
-import youtube_transcript_api
-from langchain_community.document_loaders import YoutubeLoader
-from langchain_community.document_loaders.youtube import TranscriptFormat
+from youtube_transcript_api import NoTranscriptFound, TranscriptsDisabled, YouTubeTranscriptApi

 from lfx.custom.custom_component.component import Component
 from lfx.inputs.inputs import DropdownInput, IntInput, MultilineInput
@@ -48,43 +48,133 @@ class YouTubeTranscriptsComponent(Component):
         Output(name="data_output", display_name="Transcript + Source", method="get_data_output"),
     ]

+    def _extract_video_id(self, url: str) -> str:
+        """Extract video ID from YouTube URL."""
+        patterns = [
+            r"(?:youtube\.com\/watch\?v=|youtu\.be\/|youtube\.com\/embed\/)([^&\n?#]+)",
+            r"youtube\.com\/watch\?.*?v=([^&\n?#]+)",
+        ]
+        for pattern in patterns:
+            match = re.search(pattern, url)
+            if match:
+                return match.group(1)
+        msg = f"Could not extract video ID from URL: {url}"
+        raise ValueError(msg)
+
     def _load_transcripts(self, *, as_chunks: bool = True):
         """Internal method to load transcripts from YouTube."""
-        loader = YoutubeLoader.from_youtube_url(
-            self.url,
-            transcript_format=TranscriptFormat.CHUNKS if as_chunks else TranscriptFormat.TEXT,
-            chunk_size_seconds=self.chunk_size_seconds,
-            translation=self.translation or None,
-        )
-        return loader.load()
+        try:
+            video_id = self._extract_video_id(self.url)
+        except ValueError as e:
+            msg = f"Invalid YouTube URL: {e}"
+            raise ValueError(msg) from e
+
+        try:
+            # Use new v1.0+ API - create instance
+            api = YouTubeTranscriptApi()
+            transcript_list = api.list(video_id)
+
+            # Get transcript in specified language or default to English
+            if self.translation:
+                # Get any available transcript and translate it
+                transcript = transcript_list.find_transcript(["en"])
+                transcript = transcript.translate(self.translation)
+            else:
+                # Try to get transcript in available languages
+                try:
+                    transcript = transcript_list.find_transcript(["en"])
+                except NoTranscriptFound:
+                    # Try auto-generated English
+                    transcript = transcript_list.find_generated_transcript(["en"])
+
+            # Fetch the transcript data
+            transcript_data = api.fetch(transcript.video_id, [transcript.language_code])
+
+        except (TranscriptsDisabled, NoTranscriptFound) as e:
+            error_type = type(e).__name__
+            msg = (
+                f"Could not retrieve transcripts for video '{video_id}'. "
+                "Possible reasons:\n"
+                "1. This video does not have captions/transcripts enabled\n"
+                "2. The video is private, restricted, or deleted\n"
+                f"\nTechnical error ({error_type}): {e}"
+            )
+            raise RuntimeError(msg) from e
+        except Exception as e:
+            error_type = type(e).__name__
+            msg = (
+                f"Could not retrieve transcripts for video '{video_id}'. "
+                "Possible reasons:\n"
+                "1. This video does not have captions/transcripts enabled\n"
+                "2. The video is private, restricted, or deleted\n"
+                "3. YouTube is blocking automated requests\n"
+                f"\nTechnical error ({error_type}): {e}"
+            )
+            raise RuntimeError(msg) from e
+
+        if as_chunks:
+            # Group into chunks based on chunk_size_seconds
+            return self._chunk_transcript(transcript_data)
+        # Return as continuous text
+        return transcript_data
+
+    def _chunk_transcript(self, transcript_data):
+        """Group transcript segments into time-based chunks."""
+        chunks = []
+        current_chunk = []
+        chunk_start = 0
+
+        for segment in transcript_data:
+            # Handle both dict (old API) and object (new API) formats
+            segment_start = segment.start if hasattr(segment, "start") else segment["start"]
+
+            # If this segment starts beyond the current chunk window, start a new chunk
+            if segment_start - chunk_start >= self.chunk_size_seconds and current_chunk:
+                chunk_text = " ".join(s.text if hasattr(s, "text") else s["text"] for s in current_chunk)
+                chunks.append({"start": chunk_start, "text": chunk_text})
+                current_chunk = []
+                chunk_start = segment_start
+
+            current_chunk.append(segment)
+
+        # Add the last chunk
+        if current_chunk:
+            chunk_text = " ".join(s.text if hasattr(s, "text") else s["text"] for s in current_chunk)
+            chunks.append({"start": chunk_start, "text": chunk_text})
+
+        return chunks

     def get_dataframe_output(self) -> DataFrame:
         """Provides transcript output as a DataFrame with timestamp and text columns."""
         try:
-            transcripts = self._load_transcripts(as_chunks=True)
+            chunks = self._load_transcripts(as_chunks=True)

             # Create DataFrame with timestamp and text columns
             data = []
-            for doc in transcripts:
-                start_seconds = int(doc.metadata["start_seconds"])
+            for chunk in chunks:
+                start_seconds = int(chunk["start"])
                 start_minutes = start_seconds // 60
-                start_seconds %= 60
-                timestamp = f"{start_minutes:02d}:{start_seconds:02d}"
-                data.append({"timestamp": timestamp, "text": doc.page_content})
+                start_seconds_remainder = start_seconds % 60
+                timestamp = f"{start_minutes:02d}:{start_seconds_remainder:02d}"
+                data.append({"timestamp": timestamp, "text": chunk["text"]})

             return DataFrame(pd.DataFrame(data))

-        except (youtube_transcript_api.TranscriptsDisabled, youtube_transcript_api.NoTranscriptFound) as exc:
-            return DataFrame(pd.DataFrame({"error": [f"Failed to get YouTube transcripts: {exc!s}"]}))
+        except (TranscriptsDisabled, NoTranscriptFound, RuntimeError, ValueError) as exc:
+            error_msg = f"Failed to get YouTube transcripts: {exc!s}"
+            return DataFrame(pd.DataFrame({"error": [error_msg]}))

     def get_message_output(self) -> Message:
         """Provides transcript output as continuous text."""
         try:
-            transcripts = self._load_transcripts(as_chunks=False)
-            result = transcripts[0].page_content
+            transcript_data = self._load_transcripts(as_chunks=False)
+            # Handle both dict (old API) and object (new API) formats
+            result = " ".join(
+                segment.text if hasattr(segment, "text") else segment["text"] for segment in transcript_data
+            )
             return Message(text=result)

-        except (youtube_transcript_api.TranscriptsDisabled, youtube_transcript_api.NoTranscriptFound) as exc:
+        except (TranscriptsDisabled, NoTranscriptFound, RuntimeError, ValueError) as exc:
             error_msg = f"Failed to get YouTube transcripts: {exc!s}"
             return Message(text=error_msg)
@@ -100,19 +190,17 @@ class YouTubeTranscriptsComponent(Component):
         default_data = {"transcript": "", "video_url": self.url, "error": None}

         try:
-            transcripts = self._load_transcripts(as_chunks=False)
-            if not transcripts:
+            transcript_data = self._load_transcripts(as_chunks=False)
+            if not transcript_data:
                 default_data["error"] = "No transcripts found."
                 return Data(data=default_data)

-            # Combine all transcript parts
-            full_transcript = " ".join(doc.page_content for doc in transcripts)
+            # Combine all transcript segments - handle both dict and object formats
+            full_transcript = " ".join(
+                segment.text if hasattr(segment, "text") else segment["text"] for segment in transcript_data
+            )
             return Data(data={"transcript": full_transcript, "video_url": self.url})

-        except (
-            youtube_transcript_api.TranscriptsDisabled,
-            youtube_transcript_api.NoTranscriptFound,
-            youtube_transcript_api.CouldNotRetrieveTranscript,
-        ) as exc:
+        except (TranscriptsDisabled, NoTranscriptFound, RuntimeError, ValueError) as exc:
             default_data["error"] = str(exc)
             return Data(data=default_data)
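
With YoutubeLoader gone, chunking moves in-house: _chunk_transcript opens a new window whenever a segment starts chunk_size_seconds or more after the current window's start. A worked example of that windowing, using plain dict segments and a 60-second window (standalone function mirroring the method above):

    segments = [
        {"start": 0.0, "text": "intro"},
        {"start": 40.0, "text": "setup"},
        {"start": 65.0, "text": "main point"},  # 65 - 0 >= 60 -> closes the first chunk
        {"start": 130.0, "text": "wrap up"},    # 130 - 65 >= 60 -> closes the second chunk
    ]

    def chunk_transcript(transcript_data, chunk_size_seconds=60):
        chunks, current_chunk, chunk_start = [], [], 0
        for segment in transcript_data:
            if segment["start"] - chunk_start >= chunk_size_seconds and current_chunk:
                chunks.append({"start": chunk_start, "text": " ".join(s["text"] for s in current_chunk)})
                current_chunk, chunk_start = [], segment["start"]
            current_chunk.append(segment)
        if current_chunk:
            chunks.append({"start": chunk_start, "text": " ".join(s["text"] for s in current_chunk)})
        return chunks

    print(chunk_transcript(segments))
    # e.g. [{'start': 0, 'text': 'intro setup'}, {'start': 65.0, 'text': 'main point'},
    #       {'start': 130.0, 'text': 'wrap up'}]

Note the window is anchored to each chunk's first segment rather than a fixed grid, so chunk boundaries land on segment starts and no segment is ever split.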