PyPI - lfx-nightly - Versions diffs - 0.1.13.dev0__py3-none-any.whl → 0.2.0.dev26__py3-none-any.whl - Mend

lfx-nightly 0.1.13.dev0__py3-none-any.whl → 0.2.0.dev26__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (237) hide show

lfx/_assets/component_index.json +1 -1
lfx/base/agents/agent.py +121 -29
lfx/base/agents/altk_base_agent.py +380 -0
lfx/base/agents/altk_tool_wrappers.py +565 -0
lfx/base/agents/events.py +103 -35
lfx/base/agents/utils.py +15 -2
lfx/base/composio/composio_base.py +183 -233
lfx/base/data/base_file.py +88 -21
lfx/base/data/storage_utils.py +192 -0
lfx/base/data/utils.py +178 -14
lfx/base/datastax/__init__.py +5 -0
lfx/{components/vectorstores/astradb.py → base/datastax/astradb_base.py} +84 -473
lfx/base/embeddings/embeddings_class.py +113 -0
lfx/base/io/chat.py +5 -4
lfx/base/mcp/util.py +101 -15
lfx/base/models/groq_constants.py +74 -58
lfx/base/models/groq_model_discovery.py +265 -0
lfx/base/models/model.py +1 -1
lfx/base/models/model_input_constants.py +74 -7
lfx/base/models/model_utils.py +100 -0
lfx/base/models/ollama_constants.py +3 -0
lfx/base/models/openai_constants.py +7 -0
lfx/base/models/watsonx_constants.py +36 -0
lfx/base/tools/run_flow.py +601 -129
lfx/cli/commands.py +7 -4
lfx/cli/common.py +2 -2
lfx/cli/run.py +1 -1
lfx/cli/script_loader.py +53 -11
lfx/components/Notion/create_page.py +1 -1
lfx/components/Notion/list_database_properties.py +1 -1
lfx/components/Notion/list_pages.py +1 -1
lfx/components/Notion/list_users.py +1 -1
lfx/components/Notion/page_content_viewer.py +1 -1
lfx/components/Notion/search.py +1 -1
lfx/components/Notion/update_page_property.py +1 -1
lfx/components/__init__.py +19 -5
lfx/components/altk/__init__.py +34 -0
lfx/components/altk/altk_agent.py +193 -0
lfx/components/amazon/amazon_bedrock_converse.py +1 -1
lfx/components/apify/apify_actor.py +4 -4
lfx/components/composio/__init__.py +70 -18
lfx/components/composio/apollo_composio.py +11 -0
lfx/components/composio/bitbucket_composio.py +11 -0
lfx/components/composio/canva_composio.py +11 -0
lfx/components/composio/coda_composio.py +11 -0
lfx/components/composio/composio_api.py +10 -0
lfx/components/composio/discord_composio.py +1 -1
lfx/components/composio/elevenlabs_composio.py +11 -0
lfx/components/composio/exa_composio.py +11 -0
lfx/components/composio/firecrawl_composio.py +11 -0
lfx/components/composio/fireflies_composio.py +11 -0
lfx/components/composio/gmail_composio.py +1 -1
lfx/components/composio/googlebigquery_composio.py +11 -0
lfx/components/composio/googlecalendar_composio.py +1 -1
lfx/components/composio/googledocs_composio.py +1 -1
lfx/components/composio/googlemeet_composio.py +1 -1
lfx/components/composio/googlesheets_composio.py +1 -1
lfx/components/composio/googletasks_composio.py +1 -1
lfx/components/composio/heygen_composio.py +11 -0
lfx/components/composio/mem0_composio.py +11 -0
lfx/components/composio/peopledatalabs_composio.py +11 -0
lfx/components/composio/perplexityai_composio.py +11 -0
lfx/components/composio/serpapi_composio.py +11 -0
lfx/components/composio/slack_composio.py +3 -574
lfx/components/composio/slackbot_composio.py +1 -1
lfx/components/composio/snowflake_composio.py +11 -0
lfx/components/composio/tavily_composio.py +11 -0
lfx/components/composio/youtube_composio.py +2 -2
lfx/components/{agents → cuga}/__init__.py +5 -7
lfx/components/cuga/cuga_agent.py +730 -0
lfx/components/data/__init__.py +78 -28
lfx/components/data_source/__init__.py +58 -0
lfx/components/{data → data_source}/api_request.py +26 -3
lfx/components/{data → data_source}/csv_to_data.py +15 -10
lfx/components/{data → data_source}/json_to_data.py +15 -8
lfx/components/{data → data_source}/news_search.py +1 -1
lfx/components/{data → data_source}/rss.py +1 -1
lfx/components/{data → data_source}/sql_executor.py +1 -1
lfx/components/{data → data_source}/url.py +1 -1
lfx/components/{data → data_source}/web_search.py +1 -1
lfx/components/datastax/__init__.py +12 -6
lfx/components/datastax/{astra_assistant_manager.py → astradb_assistant_manager.py} +1 -0
lfx/components/datastax/astradb_chatmemory.py +40 -0
lfx/components/datastax/astradb_cql.py +6 -32
lfx/components/datastax/astradb_graph.py +10 -124
lfx/components/datastax/astradb_tool.py +13 -53
lfx/components/datastax/astradb_vectorstore.py +134 -977
lfx/components/datastax/create_assistant.py +1 -0
lfx/components/datastax/create_thread.py +1 -0
lfx/components/datastax/dotenv.py +1 -0
lfx/components/datastax/get_assistant.py +1 -0
lfx/components/datastax/getenvvar.py +1 -0
lfx/components/datastax/graph_rag.py +1 -1
lfx/components/datastax/hcd.py +1 -1
lfx/components/datastax/list_assistants.py +1 -0
lfx/components/datastax/run.py +1 -0
lfx/components/deactivated/json_document_builder.py +1 -1
lfx/components/elastic/elasticsearch.py +1 -1
lfx/components/elastic/opensearch_multimodal.py +1575 -0
lfx/components/files_and_knowledge/__init__.py +47 -0
lfx/components/{data → files_and_knowledge}/directory.py +1 -1
lfx/components/{data → files_and_knowledge}/file.py +246 -18
lfx/components/{knowledge_bases → files_and_knowledge}/ingestion.py +17 -9
lfx/components/{knowledge_bases → files_and_knowledge}/retrieval.py +18 -10
lfx/components/{data → files_and_knowledge}/save_file.py +142 -22
lfx/components/flow_controls/__init__.py +58 -0
lfx/components/{logic → flow_controls}/conditional_router.py +1 -1
lfx/components/{logic → flow_controls}/loop.py +47 -9
lfx/components/flow_controls/run_flow.py +108 -0
lfx/components/glean/glean_search_api.py +1 -1
lfx/components/groq/groq.py +35 -28
lfx/components/helpers/__init__.py +102 -0
lfx/components/ibm/watsonx.py +25 -21
lfx/components/input_output/__init__.py +3 -1
lfx/components/input_output/chat.py +12 -3
lfx/components/input_output/chat_output.py +12 -4
lfx/components/input_output/text.py +1 -1
lfx/components/input_output/text_output.py +1 -1
lfx/components/{data → input_output}/webhook.py +1 -1
lfx/components/knowledge_bases/__init__.py +59 -4
lfx/components/langchain_utilities/character.py +1 -1
lfx/components/langchain_utilities/csv_agent.py +84 -16
lfx/components/langchain_utilities/json_agent.py +67 -12
lfx/components/langchain_utilities/language_recursive.py +1 -1
lfx/components/llm_operations/__init__.py +46 -0
lfx/components/{processing → llm_operations}/batch_run.py +1 -1
lfx/components/{processing → llm_operations}/lambda_filter.py +1 -1
lfx/components/{logic → llm_operations}/llm_conditional_router.py +1 -1
lfx/components/{processing/llm_router.py → llm_operations/llm_selector.py} +3 -3
lfx/components/{processing → llm_operations}/structured_output.py +56 -18
lfx/components/logic/__init__.py +126 -0
lfx/components/mem0/mem0_chat_memory.py +11 -0
lfx/components/mistral/mistral_embeddings.py +1 -1
lfx/components/models/__init__.py +64 -9
lfx/components/models_and_agents/__init__.py +49 -0
lfx/components/{agents → models_and_agents}/agent.py +49 -6
lfx/components/models_and_agents/embedding_model.py +423 -0
lfx/components/models_and_agents/language_model.py +398 -0
lfx/components/{agents → models_and_agents}/mcp_component.py +84 -45
lfx/components/{helpers → models_and_agents}/memory.py +1 -1
lfx/components/nvidia/system_assist.py +1 -1
lfx/components/olivya/olivya.py +1 -1
lfx/components/ollama/ollama.py +235 -14
lfx/components/openrouter/openrouter.py +49 -147
lfx/components/processing/__init__.py +9 -57
lfx/components/processing/converter.py +1 -1
lfx/components/processing/dataframe_operations.py +1 -1
lfx/components/processing/parse_json_data.py +2 -2
lfx/components/processing/parser.py +7 -2
lfx/components/processing/split_text.py +1 -1
lfx/components/qdrant/qdrant.py +1 -1
lfx/components/redis/redis.py +1 -1
lfx/components/twelvelabs/split_video.py +10 -0
lfx/components/twelvelabs/video_file.py +12 -0
lfx/components/utilities/__init__.py +43 -0
lfx/components/{helpers → utilities}/calculator_core.py +1 -1
lfx/components/{helpers → utilities}/current_date.py +1 -1
lfx/components/{processing → utilities}/python_repl_core.py +1 -1
lfx/components/vectorstores/__init__.py +0 -6
lfx/components/vectorstores/local_db.py +9 -0
lfx/components/youtube/youtube_transcripts.py +118 -30
lfx/custom/custom_component/component.py +60 -3
lfx/custom/custom_component/custom_component.py +68 -6
lfx/field_typing/constants.py +1 -0
lfx/graph/edge/base.py +45 -22
lfx/graph/graph/base.py +5 -2
lfx/graph/graph/schema.py +3 -2
lfx/graph/state/model.py +15 -2
lfx/graph/utils.py +6 -0
lfx/graph/vertex/base.py +4 -1
lfx/graph/vertex/param_handler.py +10 -7
lfx/graph/vertex/vertex_types.py +1 -1
lfx/helpers/__init__.py +12 -0
lfx/helpers/flow.py +117 -0
lfx/inputs/input_mixin.py +24 -1
lfx/inputs/inputs.py +13 -1
lfx/interface/components.py +161 -83
lfx/io/schema.py +6 -0
lfx/log/logger.py +5 -3
lfx/schema/schema.py +5 -0
lfx/services/database/__init__.py +5 -0
lfx/services/database/service.py +25 -0
lfx/services/deps.py +87 -22
lfx/services/manager.py +19 -6
lfx/services/mcp_composer/service.py +998 -157
lfx/services/session.py +5 -0
lfx/services/settings/base.py +51 -7
lfx/services/settings/constants.py +8 -0
lfx/services/storage/local.py +76 -46
lfx/services/storage/service.py +152 -29
lfx/template/field/base.py +3 -0
lfx/utils/ssrf_protection.py +384 -0
lfx/utils/validate_cloud.py +26 -0
{lfx_nightly-0.1.13.dev0.dist-info → lfx_nightly-0.2.0.dev26.dist-info}/METADATA +38 -22
{lfx_nightly-0.1.13.dev0.dist-info → lfx_nightly-0.2.0.dev26.dist-info}/RECORD +210 -196
{lfx_nightly-0.1.13.dev0.dist-info → lfx_nightly-0.2.0.dev26.dist-info}/WHEEL +1 -1
lfx/components/agents/cuga_agent.py +0 -1013
lfx/components/datastax/astra_db.py +0 -77
lfx/components/datastax/cassandra.py +0 -92
lfx/components/logic/run_flow.py +0 -71
lfx/components/models/embedding_model.py +0 -114
lfx/components/models/language_model.py +0 -144
lfx/components/vectorstores/astradb_graph.py +0 -326
lfx/components/vectorstores/cassandra.py +0 -264
lfx/components/vectorstores/cassandra_graph.py +0 -238
lfx/components/vectorstores/chroma.py +0 -167
lfx/components/vectorstores/clickhouse.py +0 -135
lfx/components/vectorstores/couchbase.py +0 -102
lfx/components/vectorstores/elasticsearch.py +0 -267
lfx/components/vectorstores/faiss.py +0 -111
lfx/components/vectorstores/graph_rag.py +0 -141
lfx/components/vectorstores/hcd.py +0 -314
lfx/components/vectorstores/milvus.py +0 -115
lfx/components/vectorstores/mongodb_atlas.py +0 -213
lfx/components/vectorstores/opensearch.py +0 -243
lfx/components/vectorstores/pgvector.py +0 -72
lfx/components/vectorstores/pinecone.py +0 -134
lfx/components/vectorstores/qdrant.py +0 -109
lfx/components/vectorstores/supabase.py +0 -76
lfx/components/vectorstores/upstash.py +0 -124
lfx/components/vectorstores/vectara.py +0 -97
lfx/components/vectorstores/vectara_rag.py +0 -164
lfx/components/vectorstores/weaviate.py +0 -89
/lfx/components/{data → data_source}/mock_data.py +0 -0
/lfx/components/datastax/{astra_vectorize.py → astradb_vectorize.py} +0 -0
/lfx/components/{logic → flow_controls}/data_conditional_router.py +0 -0
/lfx/components/{logic → flow_controls}/flow_tool.py +0 -0
/lfx/components/{logic → flow_controls}/listen.py +0 -0
/lfx/components/{logic → flow_controls}/notify.py +0 -0
/lfx/components/{logic → flow_controls}/pass_message.py +0 -0
/lfx/components/{logic → flow_controls}/sub_flow.py +0 -0
/lfx/components/{processing → models_and_agents}/prompt.py +0 -0
/lfx/components/{helpers → processing}/create_list.py +0 -0
/lfx/components/{helpers → processing}/output_parser.py +0 -0
/lfx/components/{helpers → processing}/store_message.py +0 -0
/lfx/components/{helpers → utilities}/id_generator.py +0 -0
{lfx_nightly-0.1.13.dev0.dist-info → lfx_nightly-0.2.0.dev26.dist-info}/entry_points.txt +0 -0

lfx/components/datastax/astradb_vectorstore.py CHANGED Viewed

@@ -1,191 +1,27 @@
-import re
-from collections import defaultdict
-from dataclasses import asdict, dataclass, field
-from astrapy import DataAPIClient, Database
-from astrapy.data.info.reranking import RerankServiceOptions
-from astrapy.info import CollectionDescriptor, CollectionLexicalOptions, CollectionRerankOptions
-from langchain_astradb import AstraDBVectorStore, VectorServiceOptions
-from langchain_astradb.utils.astradb import HybridSearchMode, _AstraDBCollectionEnvironment
+from astrapy import DataAPIClient
 from langchain_core.documents import Document
+from lfx.base.datastax.astradb_base import AstraDBBaseComponent
 from lfx.base.vectorstores.model import LCVectorStoreComponent, check_cached_vector_store
 from lfx.base.vectorstores.vector_store_connection_decorator import vector_store_connection
 from lfx.helpers.data import docs_to_data
-from lfx.inputs.inputs import FloatInput, NestedDictInput
-from lfx.io import (
-    BoolInput,
-    DropdownInput,
-    HandleInput,
-    IntInput,
-    QueryInput,
-    SecretStrInput,
-    StrInput,
-)
+from lfx.io import BoolInput, DropdownInput, FloatInput, HandleInput, IntInput, NestedDictInput, QueryInput, StrInput
 from lfx.schema.data import Data
 from lfx.serialization import serialize
 from lfx.utils.version import get_version_info
 @vector_store_connection
-class AstraDBVectorStoreComponent(LCVectorStoreComponent):
+class AstraDBVectorStoreComponent(AstraDBBaseComponent, LCVectorStoreComponent):
     display_name: str = "Astra DB"
     description: str = "Ingest and search documents in Astra DB"
-    documentation: str = "https://docs.langflow.org/bundles-datastax#astra-db"
+    documentation: str = "https://docs.langflow.org/bundles-datastax"
     name = "AstraDB"
     icon: str = "AstraDB"
-    _cached_vector_store: AstraDBVectorStore | None = None
-    @dataclass
-    class NewDatabaseInput:
-        functionality: str = "create"
-        fields: dict[str, dict] = field(
-            default_factory=lambda: {
-                "data": {
-                    "node": {
-                        "name": "create_database",
-                        "description": "Please allow several minutes for creation to complete.",
-                        "display_name": "Create new database",
-                        "field_order": ["01_new_database_name", "02_cloud_provider", "03_region"],
-                        "template": {
-                            "01_new_database_name": StrInput(
-                                name="new_database_name",
-                                display_name="Name",
-                                info="Name of the new database to create in Astra DB.",
-                                required=True,
-                            ),
-                            "02_cloud_provider": DropdownInput(
-                                name="cloud_provider",
-                                display_name="Cloud provider",
-                                info="Cloud provider for the new database.",
-                                options=[],
-                                required=True,
-                                real_time_refresh=True,
-                            ),
-                            "03_region": DropdownInput(
-                                name="region",
-                                display_name="Region",
-                                info="Region for the new database.",
-                                options=[],
-                                required=True,
-                            ),
-                        },
-                    },
-                }
-            }
-        )
-    @dataclass
-    class NewCollectionInput:
-        functionality: str = "create"
-        fields: dict[str, dict] = field(
-            default_factory=lambda: {
-                "data": {
-                    "node": {
-                        "name": "create_collection",
-                        "description": "Please allow several seconds for creation to complete.",
-                        "display_name": "Create new collection",
-                        "field_order": [
-                            "01_new_collection_name",
-                            "02_embedding_generation_provider",
-                            "03_embedding_generation_model",
-                            "04_dimension",
-                        ],
-                        "template": {
-                            "01_new_collection_name": StrInput(
-                                name="new_collection_name",
-                                display_name="Name",
-                                info="Name of the new collection to create in Astra DB.",
-                                required=True,
-                            ),
-                            "02_embedding_generation_provider": DropdownInput(
-                                name="embedding_generation_provider",
-                                display_name="Embedding generation method",
-                                info="Provider to use for generating embeddings.",
-                                helper_text=(
-                                    "To create collections with more embedding provider options, go to "
-                                    '<a class="underline" href="https://astra.datastax.com/" target=" _blank" '
-                                    'rel="noopener noreferrer">your database in Astra DB</a>'
-                                ),
-                                real_time_refresh=True,
-                                required=True,
-                                options=[],
-                            ),
-                            "03_embedding_generation_model": DropdownInput(
-                                name="embedding_generation_model",
-                                display_name="Embedding model",
-                                info="Model to use for generating embeddings.",
-                                real_time_refresh=True,
-                                options=[],
-                            ),
-                            "04_dimension": IntInput(
-                                name="dimension",
-                                display_name="Dimensions",
-                                info="Dimensions of the embeddings to generate.",
-                                value=None,
-                            ),
-                        },
-                    },
-                }
-            }
-        )
     inputs = [
-        SecretStrInput(
-            name="token",
-            display_name="Astra DB Application Token",
-            info="Authentication token for accessing Astra DB.",
-            value="ASTRA_DB_APPLICATION_TOKEN",
-            required=True,
-            real_time_refresh=True,
-            input_types=[],
-        ),
-        DropdownInput(
-            name="environment",
-            display_name="Environment",
-            info="The environment for the Astra DB API Endpoint.",
-            options=["prod", "test", "dev"],
-            value="prod",
-            advanced=True,
-            real_time_refresh=True,
-            combobox=True,
-        ),
-        DropdownInput(
-            name="database_name",
-            display_name="Database",
-            info="The Database name for the Astra DB instance.",
-            required=True,
-            refresh_button=True,
-            real_time_refresh=True,
-            dialog_inputs=asdict(NewDatabaseInput()),
-            combobox=True,
-        ),
-        DropdownInput(
-            name="api_endpoint",
-            display_name="Astra DB API Endpoint",
-            info="The API Endpoint for the Astra DB instance. Supercedes database selection.",
-            advanced=True,
-        ),
-        DropdownInput(
-            name="keyspace",
-            display_name="Keyspace",
-            info="Optional keyspace within Astra DB to use for the collection.",
-            advanced=True,
-            options=[],
-            real_time_refresh=True,
-        ),
-        DropdownInput(
-            name="collection_name",
-            display_name="Collection",
-            info="The name of the collection within Astra DB where the vectors will be stored.",
-            required=True,
-            refresh_button=True,
-            real_time_refresh=True,
-            dialog_inputs=asdict(NewCollectionInput()),
-            combobox=True,
-            show=False,
-        ),
+        *AstraDBBaseComponent.inputs,
+        *LCVectorStoreComponent.inputs,
         HandleInput(
             name="embedding_model",
             display_name="Embedding Model",
@@ -194,7 +30,32 @@ class AstraDBVectorStoreComponent(LCVectorStoreComponent):
             required=False,
             show=True,
         ),
-        *LCVectorStoreComponent.inputs,
+        StrInput(
+            name="content_field",
+            display_name="Content Field",
+            info="Field to use as the text content field for the vector store.",
+            advanced=True,
+        ),
+        StrInput(
+            name="deletion_field",
+            display_name="Deletion Based On Field",
+            info="When this parameter is provided, documents in the target collection with "
+            "metadata field values matching the input metadata field value will be deleted "
+            "before new data is loaded.",
+            advanced=True,
+        ),
+        BoolInput(
+            name="ignore_invalid_documents",
+            display_name="Ignore Invalid Documents",
+            info="Boolean flag to determine whether to ignore invalid documents at runtime.",
+            advanced=True,
+        ),
+        NestedDictInput(
+            name="astradb_vectorstore_kwargs",
+            display_name="AstraDBVectorStore Parameters",
+            info="Optional dictionary of additional parameters for the AstraDBVectorStore.",
+            advanced=True,
+        ),
         DropdownInput(
             name="search_method",
             display_name="Search Method",
@@ -254,856 +115,152 @@ class AstraDBVectorStoreComponent(LCVectorStoreComponent):
             info="Optional dictionary of filters to apply to the search query.",
             advanced=True,
         ),
-        BoolInput(
-            name="autodetect_collection",
-            display_name="Autodetect Collection",
-            info="Boolean flag to determine whether to autodetect the collection.",
-            advanced=True,
-            value=True,
-        ),
-        StrInput(
-            name="content_field",
-            display_name="Content Field",
-            info="Field to use as the text content field for the vector store.",
-            advanced=True,
-        ),
-        StrInput(
-            name="deletion_field",
-            display_name="Deletion Based On Field",
-            info="When this parameter is provided, documents in the target collection with "
-            "metadata field values matching the input metadata field value will be deleted "
-            "before new data is loaded.",
-            advanced=True,
-        ),
-        BoolInput(
-            name="ignore_invalid_documents",
-            display_name="Ignore Invalid Documents",
-            info="Boolean flag to determine whether to ignore invalid documents at runtime.",
-            advanced=True,
-        ),
-        NestedDictInput(
-            name="astradb_vectorstore_kwargs",
-            display_name="AstraDBVectorStore Parameters",
-            info="Optional dictionary of additional parameters for the AstraDBVectorStore.",
-            advanced=True,
-        ),
     ]
-    @classmethod
-    def map_cloud_providers(cls):
-        # TODO: Programmatically fetch the regions for each cloud provider
-        return {
-            "dev": {
-                "Amazon Web Services": {
-                    "id": "aws",
-                    "regions": ["us-west-2"],
-                },
-                "Google Cloud Platform": {
-                    "id": "gcp",
-                    "regions": ["us-central1", "europe-west4"],
-                },
-            },
-            "test": {
-                "Google Cloud Platform": {
-                    "id": "gcp",
-                    "regions": ["us-central1"],
-                },
-            },
-            "prod": {
-                "Amazon Web Services": {
-                    "id": "aws",
-                    "regions": ["us-east-2", "ap-south-1", "eu-west-1"],
-                },
-                "Google Cloud Platform": {
-                    "id": "gcp",
-                    "regions": ["us-east1"],
-                },
-                "Microsoft Azure": {
-                    "id": "azure",
-                    "regions": ["westus3"],
-                },
-            },
-        }
-    @classmethod
-    def get_vectorize_providers(cls, token: str, environment: str | None = None, api_endpoint: str | None = None):
-        try:
-            # Get the admin object
-            client = DataAPIClient(environment=environment)
-            admin_client = client.get_admin()
-            db_admin = admin_client.get_database_admin(api_endpoint, token=token)
-            # Get the list of embedding providers
-            embedding_providers = db_admin.find_embedding_providers()
-            vectorize_providers_mapping = {}
-            # Map the provider display name to the provider key and models
-            for provider_key, provider_data in embedding_providers.embedding_providers.items():
-                # Get the provider display name and models
-                display_name = provider_data.display_name
-                models = [model.name for model in provider_data.models]
-                # Build our mapping
-                vectorize_providers_mapping[display_name] = [provider_key, models]
-            # Sort the resulting dictionary
-            return defaultdict(list, dict(sorted(vectorize_providers_mapping.items())))
-        except Exception as _:  # noqa: BLE001
-            return {}
-    @classmethod
-    async def create_database_api(
-        cls,
-        new_database_name: str,
-        cloud_provider: str,
-        region: str,
-        token: str,
-        environment: str | None = None,
-        keyspace: str | None = None,
-    ):
-        client = DataAPIClient(environment=environment)
-        # Get the admin object
-        admin_client = client.get_admin(token=token)
-        # Get the environment, set to prod if null like
-        my_env = environment or "prod"
-        # Raise a value error if name isn't provided
-        if not new_database_name:
-            msg = "Database name is required to create a new database."
-            raise ValueError(msg)
-        # Call the create database function
-        return await admin_client.async_create_database(
-            name=new_database_name,
-            cloud_provider=cls.map_cloud_providers()[my_env][cloud_provider]["id"],
-            region=region,
-            keyspace=keyspace,
-            wait_until_active=False,
-        )
-    @classmethod
-    async def create_collection_api(
-        cls,
-        new_collection_name: str,
-        token: str,
-        api_endpoint: str,
-        environment: str | None = None,
-        keyspace: str | None = None,
-        dimension: int | None = None,
-        embedding_generation_provider: str | None = None,
-        embedding_generation_model: str | None = None,
-        reranker: str | None = None,
-    ):
-        # Build vectorize options, if needed
-        vectorize_options = None
-        if not dimension:
-            providers = cls.get_vectorize_providers(token=token, environment=environment, api_endpoint=api_endpoint)
-            vectorize_options = VectorServiceOptions(
-                provider=providers.get(embedding_generation_provider, [None, []])[0],
-                model_name=embedding_generation_model,
-            )
-        # Raise a value error if name isn't provided
-        if not new_collection_name:
-            msg = "Collection name is required to create a new collection."
-            raise ValueError(msg)
-        # Define the base arguments being passed to the create collection function
-        base_args = {
-            "collection_name": new_collection_name,
-            "token": token,
-            "api_endpoint": api_endpoint,
-            "keyspace": keyspace,
-            "environment": environment,
-            "embedding_dimension": dimension,
-            "collection_vector_service_options": vectorize_options,
-        }
-        # Add optional arguments if the reranker is set
-        if reranker:
-            # Split the reranker field into a provider a model name
-            provider, _ = reranker.split("/")
-            base_args["collection_rerank"] = CollectionRerankOptions(
-                service=RerankServiceOptions(provider=provider, model_name=reranker),
-            )
-            base_args["collection_lexical"] = CollectionLexicalOptions(analyzer="STANDARD")
-        _AstraDBCollectionEnvironment(**base_args)
-    @classmethod
-    def get_database_list_static(cls, token: str, environment: str | None = None):
-        client = DataAPIClient(environment=environment)
-        # Get the admin object
-        admin_client = client.get_admin(token=token)
-        # Get the list of databases
-        db_list = admin_client.list_databases()
-        # Generate the api endpoint for each database
-        db_info_dict = {}
-        for db in db_list:
-            try:
-                # Get the API endpoint for the database
-                api_endpoints = [db_reg.api_endpoint for db_reg in db.regions]
-                # Get the number of collections
-                try:
-                    # Get the number of collections in the database
-                    num_collections = len(
-                        client.get_database(
-                            api_endpoints[0],
-                            token=token,
-                        ).list_collection_names()
-                    )
-                except Exception:  # noqa: BLE001
-                    if db.status != "PENDING":
-                        continue
-                    num_collections = 0
-                # Add the database to the dictionary
-                db_info_dict[db.name] = {
-                    "api_endpoints": api_endpoints,
-                    "keyspaces": db.keyspaces,
-                    "collections": num_collections,
-                    "status": db.status if db.status != "ACTIVE" else None,
-                    "org_id": db.org_id if db.org_id else None,
-                }
-            except Exception:  # noqa: BLE001
-                pass
-        return db_info_dict
-    def get_database_list(self):
-        return self.get_database_list_static(
-            token=self.token,
-            environment=self.environment,
-        )
-    @classmethod
-    def get_api_endpoint_static(
-        cls,
-        token: str,
-        environment: str | None = None,
-        api_endpoint: str | None = None,
-        database_name: str | None = None,
-    ):
-        # If the api_endpoint is set, return it
-        if api_endpoint:
-            return api_endpoint
-        # Check if the database_name is like a url
-        if database_name and database_name.startswith("https://"):
-            return database_name
-        # If the database is not set, nothing we can do.
-        if not database_name:
-            return None
-        # Grab the database object
-        db = cls.get_database_list_static(token=token, environment=environment).get(database_name)
-        if not db:
-            return None
-        # Otherwise, get the URL from the database list
-        endpoints = db.get("api_endpoints") or []
-        return endpoints[0] if endpoints else None
-    def get_api_endpoint(self):
-        return self.get_api_endpoint_static(
-            token=self.token,
-            environment=self.environment,
-            api_endpoint=self.api_endpoint,
-            database_name=self.database_name,
-        )
-    @classmethod
-    def get_database_id_static(cls, api_endpoint: str) -> str | None:
-        # Pattern matches standard UUID format: 8-4-4-4-12 hexadecimal characters
-        uuid_pattern = r"[0-9a-fA-F]{8}-[0-9a-fA-F]{4}-[0-9a-fA-F]{4}-[0-9a-fA-F]{4}-[0-9a-fA-F]{12}"
-        match = re.search(uuid_pattern, api_endpoint)
-        return match.group(0) if match else None
-    def get_database_id(self):
-        return self.get_database_id_static(api_endpoint=self.get_api_endpoint())
-    def get_keyspace(self):
-        keyspace = self.keyspace
-        if keyspace:
-            return keyspace.strip()
-        return "default_keyspace"
-    def get_database_object(self, api_endpoint: str | None = None):
-        try:
-            client = DataAPIClient(environment=self.environment)
-            return client.get_database(
-                api_endpoint or self.get_api_endpoint(),
-                token=self.token,
-                keyspace=self.get_keyspace(),
-            )
-        except Exception as e:
-            msg = f"Error fetching database object: {e}"
-            raise ValueError(msg) from e
-    def collection_data(self, collection_name: str, database: Database | None = None):
-        try:
-            if not database:
-                client = DataAPIClient(environment=self.environment)
-                database = client.get_database(
-                    self.get_api_endpoint(),
-                    token=self.token,
-                    keyspace=self.get_keyspace(),
-                )
-            collection = database.get_collection(collection_name)
-            return collection.estimated_document_count()
-        except Exception as e:  # noqa: BLE001
-            self.log(f"Error checking collection data: {e}")
-            return None
-    def _initialize_database_options(self):
-        try:
-            return [
-                {
-                    "name": name,
-                    "status": info["status"],
-                    "collections": info["collections"],
-                    "api_endpoints": info["api_endpoints"],
-                    "keyspaces": info["keyspaces"],
-                    "org_id": info["org_id"],
-                }
-                for name, info in self.get_database_list().items()
-            ]
-        except Exception as e:
-            msg = f"Error fetching database options: {e}"
-            raise ValueError(msg) from e
-    @classmethod
-    def get_provider_icon(cls, collection: CollectionDescriptor | None = None, provider_name: str | None = None) -> str:
-        # Get the provider name from the collection
-        provider_name = provider_name or (
-            collection.definition.vector.service.provider
-            if (
-                collection
-                and collection.definition
-                and collection.definition.vector
-                and collection.definition.vector.service
-            )
-            else None
+    async def update_build_config(
+        self,
+        build_config: dict,
+        field_value: str | dict,
+        field_name: str | None = None,
+    ) -> dict:
+        """Update build configuration with proper handling of embedding and search options."""
+        # Handle base astra db build config updates
+        build_config = await super().update_build_config(
+            build_config,
+            field_value=field_value,
+            field_name=field_name,
         )
-        # If there is no provider, use the vector store icon
-        if not provider_name or provider_name.lower() == "bring your own":
-            return "vectorstores"
-        # Map provider casings
-        case_map = {
-            "nvidia": "NVIDIA",
-            "openai": "OpenAI",
-            "amazon bedrock": "AmazonBedrockEmbeddings",
-            "azure openai": "AzureOpenAiEmbeddings",
-            "cohere": "Cohere",
-            "jina ai": "JinaAI",
-            "mistral ai": "MistralAI",
-            "upstage": "Upstage",
-            "voyage ai": "VoyageAI",
-        }
+        # Set embedding model display based on provider selection
+        if isinstance(field_value, dict) and "02_embedding_generation_provider" in field_value:
+            embedding_provider = field_value.get("02_embedding_generation_provider")
+            is_custom_provider = embedding_provider and embedding_provider != "Bring your own"
+            provider = embedding_provider.lower() if is_custom_provider and embedding_provider is not None else None
-        # Adjust the casing on some like nvidia
-        return case_map[provider_name.lower()] if provider_name.lower() in case_map else provider_name.title()
-    def _initialize_collection_options(self, api_endpoint: str | None = None):
-        # Nothing to generate if we don't have an API endpoint yet
-        api_endpoint = api_endpoint or self.get_api_endpoint()
-        if not api_endpoint:
-            return []
+            build_config["embedding_model"]["show"] = not bool(provider)
+            build_config["embedding_model"]["required"] = not bool(provider)
-        # Retrieve the database object
-        database = self.get_database_object(api_endpoint=api_endpoint)
-        # Get the list of collections
-        collection_list = database.list_collections(keyspace=self.get_keyspace())
-        # Return the list of collections and metadata associated
-        return [
-            {
-                "name": col.name,
-                "records": self.collection_data(collection_name=col.name, database=database),
-                "provider": (
-                    col.definition.vector.service.provider
-                    if col.definition.vector and col.definition.vector.service
-                    else None
-                ),
-                "icon": self.get_provider_icon(collection=col),
-                "model": (
-                    col.definition.vector.service.model_name
-                    if col.definition.vector and col.definition.vector.service
-                    else None
-                ),
-            }
-            for col in collection_list
-        ]
-    def reset_provider_options(self, build_config: dict) -> dict:
-        """Reset provider options and related configurations in the build_config dictionary."""
-        # Extract template path for cleaner access
-        template = build_config["collection_name"]["dialog_inputs"]["fields"]["data"]["node"]["template"]
-        # Get vectorize providers
-        vectorize_providers_api = self.get_vectorize_providers(
-            token=self.token,
-            environment=self.environment,
-            api_endpoint=build_config["api_endpoint"]["value"],
-        )
-        # Create a new dictionary with "Bring your own" first
-        vectorize_providers: dict[str, list[list[str]]] = {"Bring your own": [[], []]}
-        # Add the remaining items (only Nvidia) from the original dictionary
-        vectorize_providers.update(
-            {
-                k: v
-                for k, v in vectorize_providers_api.items()
-                if k.lower() in ["nvidia"]  # TODO: Eventually support more
-            }
-        )
-        # Set provider options
-        provider_field = "02_embedding_generation_provider"
-        template[provider_field]["options"] = list(vectorize_providers.keys())
-        # Add metadata for each provider option
-        template[provider_field]["options_metadata"] = [
-            {"icon": self.get_provider_icon(provider_name=provider)} for provider in template[provider_field]["options"]
-        ]
-        # Get selected embedding provider
-        embedding_provider = template[provider_field]["value"]
-        is_bring_your_own = embedding_provider and embedding_provider == "Bring your own"
-        # Configure embedding model field
-        model_field = "03_embedding_generation_model"
-        template[model_field].update(
-            {
-                "options": vectorize_providers.get(embedding_provider, [[], []])[1],
-                "placeholder": "Bring your own" if is_bring_your_own else None,
-                "readonly": is_bring_your_own,
-                "required": not is_bring_your_own,
-                "value": None,
-            }
-        )
-        # If this is a bring your own, set dimensions to 0
-        return self.reset_dimension_field(build_config)
+        # Early return if no API endpoint is configured
+        if not self.get_api_endpoint():
+            return build_config
-    def reset_dimension_field(self, build_config: dict) -> dict:
-        """Reset dimension field options based on provided configuration."""
-        # Extract template path for cleaner access
-        template = build_config["collection_name"]["dialog_inputs"]["fields"]["data"]["node"]["template"]
+        # Configure search method and related options
+        return self._configure_search_options(build_config)
-        # Get selected embedding model
-        provider_field = "02_embedding_generation_provider"
-        embedding_provider = template[provider_field]["value"]
-        is_bring_your_own = embedding_provider and embedding_provider == "Bring your own"
+    def _configure_search_options(self, build_config: dict) -> dict:
+        """Configure hybrid search, reranker, and vector search options."""
+        # Detect available hybrid search capabilities
+        hybrid_capabilities = self._detect_hybrid_capabilities()
-        # Configure dimension field
-        dimension_field = "04_dimension"
-        dimension_value = 1024 if not is_bring_your_own else None  # TODO: Dynamically figure this out
-        template[dimension_field].update(
-            {
-                "placeholder": dimension_value,
-                "value": dimension_value,
-                "readonly": not is_bring_your_own,
-                "required": is_bring_your_own,
-            }
-        )
-        return build_config
+        # Return if we haven't selected a collection
+        if not build_config["collection_name"]["options"] or not build_config["collection_name"]["value"]:
+            return build_config
-    def reset_collection_list(self, build_config: dict) -> dict:
-        """Reset collection list options based on provided configuration."""
         # Get collection options
-        collection_options = self._initialize_collection_options(api_endpoint=build_config["api_endpoint"]["value"])
-        # Update collection configuration
-        collection_config = build_config["collection_name"]
-        collection_config.update(
-            {
-                "options": [col["name"] for col in collection_options],
-                "options_metadata": [{k: v for k, v in col.items() if k != "name"} for col in collection_options],
-            }
-        )
-        # Reset selected collection if not in options
-        if collection_config["value"] not in collection_config["options"]:
-            collection_config["value"] = ""
+        collection_options = self._get_collection_options(build_config)
-        # Set advanced status based on database selection
-        collection_config["show"] = bool(build_config["database_name"]["value"])
+        # Get the selected collection index
+        index = build_config["collection_name"]["options"].index(build_config["collection_name"]["value"])
+        provider = build_config["collection_name"]["options_metadata"][index]["provider"]
+        build_config["embedding_model"]["show"] = not bool(provider)
+        build_config["embedding_model"]["required"] = not bool(provider)
-        return build_config
+        # Determine search configuration
+        is_vector_search = build_config["search_method"]["value"] == "Vector Search"
+        is_autodetect = build_config["autodetect_collection"]["value"]
-    def reset_database_list(self, build_config: dict) -> dict:
-        """Reset database list options and related configurations."""
-        # Get database options
-        database_options = self._initialize_database_options()
+        # Apply hybrid search configuration
+        if hybrid_capabilities["available"]:
+            build_config["search_method"]["show"] = True
+            build_config["search_method"]["options"] = ["Hybrid Search", "Vector Search"]
+            build_config["search_method"]["value"] = build_config["search_method"].get("value", "Hybrid Search")
-        # Update cloud provider options
-        env = self.environment
-        template = build_config["database_name"]["dialog_inputs"]["fields"]["data"]["node"]["template"]
-        template["02_cloud_provider"]["options"] = list(self.map_cloud_providers()[env].keys())
+            build_config["reranker"]["options"] = hybrid_capabilities["reranker_models"]
+            build_config["reranker"]["options_metadata"] = hybrid_capabilities["reranker_metadata"]
+            if hybrid_capabilities["reranker_models"]:
+                build_config["reranker"]["value"] = hybrid_capabilities["reranker_models"][0]
+        else:
+            build_config["search_method"]["show"] = False
+            build_config["search_method"]["options"] = ["Vector Search"]
+            build_config["search_method"]["value"] = "Vector Search"
+            build_config["reranker"]["options"] = []
+            build_config["reranker"]["options_metadata"] = []
-        # Update database configuration
-        database_config = build_config["database_name"]
-        database_config.update(
-            {
-                "options": [db["name"] for db in database_options],
-                "options_metadata": [{k: v for k, v in db.items() if k != "name"} for db in database_options],
-            }
+        # Configure reranker visibility and state
+        hybrid_enabled = (
+            collection_options["rerank_enabled"] and build_config["search_method"]["value"] == "Hybrid Search"
         )
-        # Reset selections if value not in options
-        if database_config["value"] not in database_config["options"]:
-            database_config["value"] = ""
-            build_config["api_endpoint"]["options"] = []
-            build_config["api_endpoint"]["value"] = ""
-            build_config["collection_name"]["show"] = False
+        build_config["reranker"]["show"] = hybrid_enabled
+        build_config["reranker"]["toggle_value"] = hybrid_enabled
+        build_config["reranker"]["toggle_disable"] = is_vector_search
-        # Set advanced status based on token presence
-        database_config["show"] = bool(build_config["token"]["value"])
-        return build_config
+        # Configure lexical terms
+        lexical_visible = collection_options["lexical_enabled"] and not is_vector_search
+        build_config["lexical_terms"]["show"] = lexical_visible
+        build_config["lexical_terms"]["value"] = "" if is_vector_search else build_config["lexical_terms"]["value"]
-    def reset_build_config(self, build_config: dict) -> dict:
-        """Reset all build configuration options to default empty state."""
-        # Reset database configuration
-        database_config = build_config["database_name"]
-        database_config.update({"options": [], "options_metadata": [], "value": "", "show": False})
-        build_config["api_endpoint"]["options"] = []
-        build_config["api_endpoint"]["value"] = ""
+        # Configure search type and score threshold
+        build_config["search_type"]["show"] = is_vector_search
+        build_config["search_score_threshold"]["show"] = is_vector_search
-        # Reset hybrid search options
-        build_config["reranker"]["options"] = []
-        build_config["reranker"]["value"] = ""
-        build_config["reranker"]["show"] = False
-        build_config["lexical_terms"]["value"] = ""
-        build_config["lexical_terms"]["show"] = False
-        # Reset collection configuration
-        collection_config = build_config["collection_name"]
-        collection_config.update({"options": [], "options_metadata": [], "value": "", "show": False})
+        # Force similarity search for hybrid mode or autodetect
+        if hybrid_enabled or is_autodetect:
+            build_config["search_type"]["value"] = "Similarity"
         return build_config
-    def _handle_hybrid_search_options(self, build_config: dict) -> dict:
-        """Set hybrid search options in the build configuration."""
-        # Detect what hybrid options are available
-        # Get the admin object
-        client = DataAPIClient(environment=self.environment)
+    def _detect_hybrid_capabilities(self) -> dict:
+        """Detect available hybrid search and reranking capabilities."""
+        environment = self.get_environment(self.environment)
+        client = DataAPIClient(environment=environment)
         admin_client = client.get_admin()
         db_admin = admin_client.get_database_admin(self.get_api_endpoint(), token=self.token)
-        # We will try to get the reranking providers to see if its hybrid emabled
         try:
             providers = db_admin.find_reranking_providers()
-            build_config["reranker"]["options"] = [
+            reranker_models = [
                 model.name for provider_data in providers.reranking_providers.values() for model in provider_data.models
             ]
-            build_config["reranker"]["options_metadata"] = [
+            reranker_metadata = [
                 {"icon": self.get_provider_icon(provider_name=model.name.split("/")[0])}
                 for provider in providers.reranking_providers.values()
                 for model in provider.models
             ]
-            build_config["reranker"]["value"] = build_config["reranker"]["options"][0]
-            # Set the default search field to hybrid search
-            build_config["search_method"]["show"] = True
-            build_config["search_method"]["options"] = ["Hybrid Search", "Vector Search"]
-            build_config["search_method"]["value"] = "Hybrid Search"
-        except Exception as _:  # noqa: BLE001
-            build_config["reranker"]["options"] = []
-            build_config["reranker"]["options_metadata"] = []
-            # Set the default search field to vector search
-            build_config["search_method"]["show"] = False
-            build_config["search_method"]["options"] = ["Vector Search"]
-            build_config["search_method"]["value"] = "Vector Search"
-        return build_config
-    async def update_build_config(self, build_config: dict, field_value: str, field_name: str | None = None) -> dict:
-        """Update build configuration based on field name and value."""
-        # Early return if no token provided
-        if not self.token:
-            return self.reset_build_config(build_config)
-        # Database creation callback
-        if field_name == "database_name" and isinstance(field_value, dict):
-            if "01_new_database_name" in field_value:
-                await self._create_new_database(build_config, field_value)
-                return self.reset_collection_list(build_config)
-            return self._update_cloud_regions(build_config, field_value)
-        # Collection creation callback
-        if field_name == "collection_name" and isinstance(field_value, dict):
-            # Case 1: New collection creation
-            if "01_new_collection_name" in field_value:
-                await self._create_new_collection(build_config, field_value)
-                return build_config
-            # Case 2: Update embedding provider options
-            if "02_embedding_generation_provider" in field_value:
-                return self.reset_provider_options(build_config)
-            # Case 3: Update dimension field
-            if "03_embedding_generation_model" in field_value:
-                return self.reset_dimension_field(build_config)
-        # Initial execution or token/environment change
-        first_run = field_name == "collection_name" and not field_value and not build_config["database_name"]["options"]
-        if first_run or field_name in {"token", "environment"}:
-            return self.reset_database_list(build_config)
-        # Database selection change
-        if field_name == "database_name" and not isinstance(field_value, dict):
-            return self._handle_database_selection(build_config, field_value)
-        # Keyspace selection change
-        if field_name == "keyspace":
-            return self.reset_collection_list(build_config)
-        # Collection selection change
-        if field_name == "collection_name" and not isinstance(field_value, dict):
-            return self._handle_collection_selection(build_config, field_value)
-        # Search method selection change
-        if field_name == "search_method":
-            is_vector_search = field_value == "Vector Search"
-            is_autodetect = build_config["autodetect_collection"]["value"]
-            # Configure lexical terms (same for both cases)
-            build_config["lexical_terms"]["show"] = not is_vector_search
-            build_config["lexical_terms"]["value"] = "" if is_vector_search else build_config["lexical_terms"]["value"]
-            # Disable reranker disabling if hybrid search is selected
-            build_config["reranker"]["show"] = not is_vector_search
-            build_config["reranker"]["toggle_disable"] = not is_vector_search
-            build_config["reranker"]["toggle_value"] = True
-            build_config["reranker"]["value"] = build_config["reranker"]["options"][0]
-            # Toggle search type and score threshold based on search method
-            build_config["search_type"]["show"] = is_vector_search
-            build_config["search_score_threshold"]["show"] = is_vector_search
-            # Make sure the search_type is set to "Similarity"
-            if not is_vector_search or is_autodetect:
-                build_config["search_type"]["value"] = "Similarity"
-        return build_config
-    async def _create_new_database(self, build_config: dict, field_value: dict) -> None:
-        """Create a new database and update build config options."""
-        try:
-            await self.create_database_api(
-                new_database_name=field_value["01_new_database_name"],
-                token=self.token,
-                keyspace=self.get_keyspace(),
-                environment=self.environment,
-                cloud_provider=field_value["02_cloud_provider"],
-                region=field_value["03_region"],
-            )
-        except Exception as e:
-            msg = f"Error creating database: {e}"
-            raise ValueError(msg) from e
-        build_config["database_name"]["options"].append(field_value["01_new_database_name"])
-        build_config["database_name"]["options_metadata"].append(
-            {
-                "status": "PENDING",
-                "collections": 0,
-                "api_endpoints": [],
-                "keyspaces": [self.get_keyspace()],
-                "org_id": None,
-            }
-        )
-    def _update_cloud_regions(self, build_config: dict, field_value: dict) -> dict:
-        """Update cloud provider regions in build config."""
-        env = self.environment
-        cloud_provider = field_value["02_cloud_provider"]
-        # Update the region options based on the selected cloud provider
-        template = build_config["database_name"]["dialog_inputs"]["fields"]["data"]["node"]["template"]
-        template["03_region"]["options"] = self.map_cloud_providers()[env][cloud_provider]["regions"]
-        # Reset the the 03_region value if it's not in the new options
-        if template["03_region"]["value"] not in template["03_region"]["options"]:
-            template["03_region"]["value"] = None
-        return build_config
-    async def _create_new_collection(self, build_config: dict, field_value: dict) -> None:
-        """Create a new collection and update build config options."""
-        embedding_provider = field_value.get("02_embedding_generation_provider")
-        try:
-            await self.create_collection_api(
-                new_collection_name=field_value["01_new_collection_name"],
-                token=self.token,
-                api_endpoint=build_config["api_endpoint"]["value"],
-                environment=self.environment,
-                keyspace=self.get_keyspace(),
-                dimension=field_value.get("04_dimension") if embedding_provider == "Bring your own" else None,
-                embedding_generation_provider=embedding_provider,
-                embedding_generation_model=field_value.get("03_embedding_generation_model"),
-                reranker=self.reranker,
-            )
-        except Exception as e:
-            msg = f"Error creating collection: {e}"
-            raise ValueError(msg) from e
-        provider = embedding_provider.lower() if embedding_provider and embedding_provider != "Bring your own" else None
-        build_config["collection_name"].update(
-            {
-                "value": field_value["01_new_collection_name"],
-                "options": build_config["collection_name"]["options"] + [field_value["01_new_collection_name"]],
+        except Exception as e:  # noqa: BLE001
+            self.log(f"Hybrid search not available: {e}")
+            return {
+                "available": False,
+                "reranker_models": [],
+                "reranker_metadata": [],
             }
-        )
-        build_config["embedding_model"]["show"] = not bool(provider)
-        build_config["embedding_model"]["required"] = not bool(provider)
-        build_config["collection_name"]["options_metadata"].append(
-            {
-                "records": 0,
-                "provider": provider,
-                "icon": self.get_provider_icon(provider_name=provider),
-                "model": field_value.get("03_embedding_generation_model"),
+        else:
+            return {
+                "available": True,
+                "reranker_models": reranker_models,
+                "reranker_metadata": reranker_metadata,
             }
-        )
-        # Make sure we always show the reranker options if the collection is hybrid enabled
-        # And right now they always are
-        build_config["lexical_terms"]["show"] = True
-    def _handle_database_selection(self, build_config: dict, field_value: str) -> dict:
-        """Handle database selection and update related configurations."""
-        build_config = self.reset_database_list(build_config)
-        # Reset collection list if database selection changes
-        if field_value not in build_config["database_name"]["options"]:
-            build_config["database_name"]["value"] = ""
-            return build_config
-        # Get the api endpoint for the selected database
-        index = build_config["database_name"]["options"].index(field_value)
-        build_config["api_endpoint"]["options"] = build_config["database_name"]["options_metadata"][index][
-            "api_endpoints"
-        ]
-        build_config["api_endpoint"]["value"] = build_config["database_name"]["options_metadata"][index][
-            "api_endpoints"
-        ][0]
-        # Get the org_id for the selected database
-        org_id = build_config["database_name"]["options_metadata"][index]["org_id"]
-        if not org_id:
-            return build_config
-        # Update the list of keyspaces based on the db info
-        build_config["keyspace"]["options"] = build_config["database_name"]["options_metadata"][index]["keyspaces"]
-        build_config["keyspace"]["value"] = (
-            build_config["keyspace"]["options"] and build_config["keyspace"]["options"][0]
-            if build_config["keyspace"]["value"] not in build_config["keyspace"]["options"]
-            else build_config["keyspace"]["value"]
-        )
-        # Get the database id for the selected database
-        db_id = self.get_database_id_static(api_endpoint=build_config["api_endpoint"]["value"])
-        keyspace = self.get_keyspace()
-        # Update the helper text for the embedding provider field
-        template = build_config["collection_name"]["dialog_inputs"]["fields"]["data"]["node"]["template"]
-        template["02_embedding_generation_provider"]["helper_text"] = (
-            "To create collections with more embedding provider options, go to "
-            f'<a class="underline" target="_blank" rel="noopener noreferrer" '
-            f'href="https://astra.datastax.com/org/{org_id}/database/{db_id}/data-explorer?createCollection=1&namespace={keyspace}">'
-            "your database in Astra DB</a>."
-        )
-        # Reset provider options
-        build_config = self.reset_provider_options(build_config)
-        # Handle hybrid search options
-        build_config = self._handle_hybrid_search_options(build_config)
-        return self.reset_collection_list(build_config)
-    def _handle_collection_selection(self, build_config: dict, field_value: str) -> dict:
-        """Handle collection selection and update embedding options."""
-        build_config["autodetect_collection"]["value"] = True
-        build_config = self.reset_collection_list(build_config)
-        # Reset embedding model if collection selection changes
-        if field_value and field_value not in build_config["collection_name"]["options"]:
-            build_config["collection_name"]["options"].append(field_value)
-            build_config["collection_name"]["options_metadata"].append(
-                {
-                    "records": 0,
-                    "provider": None,
-                    "icon": "vectorstores",
-                    "model": None,
-                }
-            )
-            build_config["autodetect_collection"]["value"] = False
-        if not field_value:
-            return build_config
-        # Get the selected collection index
-        index = build_config["collection_name"]["options"].index(field_value)
-        # Set the provider of the selected collection
-        provider = build_config["collection_name"]["options_metadata"][index]["provider"]
-        build_config["embedding_model"]["show"] = not bool(provider)
-        build_config["embedding_model"]["required"] = not bool(provider)
-        # Grab the collection object
+    def _get_collection_options(self, build_config: dict) -> dict:
+        """Retrieve collection-level search options."""
         database = self.get_database_object(api_endpoint=build_config["api_endpoint"]["value"])
         collection = database.get_collection(
-            name=field_value,
+            name=build_config["collection_name"]["value"],
             keyspace=build_config["keyspace"]["value"],
         )
-        # Check if hybrid and lexical are enabled
         col_options = collection.options()
-        hyb_enabled = col_options.rerank and col_options.rerank.enabled
-        lex_enabled = col_options.lexical and col_options.lexical.enabled
-        user_hyb_enabled = build_config["search_method"]["value"] == "Hybrid Search"
-        # Reranker visible when both the collection supports it and the user selected Hybrid
-        hybrid_active = bool(hyb_enabled and user_hyb_enabled)
-        build_config["reranker"]["show"] = hybrid_active
-        build_config["reranker"]["toggle_value"] = hybrid_active
-        build_config["reranker"]["toggle_disable"] = False  # allow user to toggle if visible
-        # If hybrid is active, lock search_type to "Similarity"
-        if hybrid_active:
-            build_config["search_type"]["value"] = "Similarity"
-        # Show the lexical terms option only if the collection enables lexical search
-        build_config["lexical_terms"]["show"] = bool(lex_enabled)
-        return build_config
+        return {
+            "rerank_enabled": bool(col_options.rerank and col_options.rerank.enabled),
+            "lexical_enabled": bool(col_options.lexical and col_options.lexical.enabled),
+        }
     @check_cached_vector_store
     def build_vector_store(self):
         try:
             from langchain_astradb import AstraDBVectorStore
+            from langchain_astradb.utils.astradb import HybridSearchMode
         except ImportError as e:
             msg = (
                 "Could not import langchain Astra DB integration package. "
@@ -1164,7 +321,7 @@ class AstraDBVectorStoreComponent(LCVectorStoreComponent):
                 **embedding_params,
                 **additional_params,
             )
-        except Exception as e:
+        except ValueError as e:
             msg = f"Error initializing AstraDBVectorStore: {e}"
             raise ValueError(msg) from e
@@ -1196,7 +353,7 @@ class AstraDBVectorStoreComponent(LCVectorStoreComponent):
                 delete_values = list({doc.metadata[self.deletion_field] for doc in documents})
                 self.log(f"Deleting documents where {self.deletion_field} matches {delete_values}.")
                 collection.delete_many({f"metadata.{self.deletion_field}": {"$in": delete_values}})
-            except Exception as e:
+            except ValueError as e:
                 msg = f"Error deleting documents from AstraDBVectorStore based on '{self.deletion_field}': {e}"
                 raise ValueError(msg) from e
@@ -1204,7 +361,7 @@ class AstraDBVectorStoreComponent(LCVectorStoreComponent):
             self.log(f"Adding {len(documents)} documents to the Vector Store.")
             try:
                 vector_store.add_documents(documents)
-            except Exception as e:
+            except ValueError as e:
                 msg = f"Error adding documents to AstraDBVectorStore: {e}"
                 raise ValueError(msg) from e
         else:
@@ -1257,7 +414,7 @@ class AstraDBVectorStoreComponent(LCVectorStoreComponent):
         try:
             search_args = self._build_search_args()
-        except Exception as e:
+        except ValueError as e:
             msg = f"Error in AstraDBVectorStore._build_search_args: {e}"
             raise ValueError(msg) from e
@@ -1271,7 +428,7 @@ class AstraDBVectorStoreComponent(LCVectorStoreComponent):
         try:
             self.log(f"Calling vector_store.{search_method} with args: {search_args}")
             docs = getattr(vector_store, search_method)(**search_args)
-        except Exception as e:
+        except ValueError as e:
             msg = f"Error performing {search_method} in AstraDBVectorStore: {e}"
             raise ValueError(msg) from e

lfx-nightly 0.1.13.dev0__py3-none-any.whl → 0.2.0.dev26__py3-none-any.whl

lfx-nightly 0.1.13.dev0__py3-none-any.whl → 0.2.0.dev26__py3-none-any.whl