MindsDB 25.9.2.0a1__py3-none-any.whl → 25.10.0__py3-none-any.whl
This diff compares the contents of publicly released package versions as they appear in their respective public registries. It is provided for informational purposes only.
Potentially problematic release: this version of MindsDB might be problematic.
- mindsdb/__about__.py +1 -1
- mindsdb/__main__.py +40 -29
- mindsdb/api/a2a/__init__.py +1 -1
- mindsdb/api/a2a/agent.py +16 -10
- mindsdb/api/a2a/common/server/server.py +7 -3
- mindsdb/api/a2a/common/server/task_manager.py +12 -5
- mindsdb/api/a2a/common/types.py +66 -0
- mindsdb/api/a2a/task_manager.py +65 -17
- mindsdb/api/common/middleware.py +10 -12
- mindsdb/api/executor/command_executor.py +51 -40
- mindsdb/api/executor/datahub/datanodes/datanode.py +2 -2
- mindsdb/api/executor/datahub/datanodes/information_schema_datanode.py +7 -13
- mindsdb/api/executor/datahub/datanodes/integration_datanode.py +101 -49
- mindsdb/api/executor/datahub/datanodes/project_datanode.py +8 -4
- mindsdb/api/executor/datahub/datanodes/system_tables.py +3 -2
- mindsdb/api/executor/exceptions.py +29 -10
- mindsdb/api/executor/planner/plan_join.py +17 -3
- mindsdb/api/executor/planner/query_prepare.py +2 -20
- mindsdb/api/executor/sql_query/sql_query.py +74 -74
- mindsdb/api/executor/sql_query/steps/fetch_dataframe.py +1 -2
- mindsdb/api/executor/sql_query/steps/subselect_step.py +0 -1
- mindsdb/api/executor/utilities/functions.py +6 -6
- mindsdb/api/executor/utilities/sql.py +37 -20
- mindsdb/api/http/gui.py +5 -11
- mindsdb/api/http/initialize.py +75 -61
- mindsdb/api/http/namespaces/agents.py +10 -15
- mindsdb/api/http/namespaces/analysis.py +13 -20
- mindsdb/api/http/namespaces/auth.py +1 -1
- mindsdb/api/http/namespaces/chatbots.py +0 -5
- mindsdb/api/http/namespaces/config.py +15 -11
- mindsdb/api/http/namespaces/databases.py +140 -201
- mindsdb/api/http/namespaces/file.py +17 -4
- mindsdb/api/http/namespaces/handlers.py +17 -7
- mindsdb/api/http/namespaces/knowledge_bases.py +28 -7
- mindsdb/api/http/namespaces/models.py +94 -126
- mindsdb/api/http/namespaces/projects.py +13 -22
- mindsdb/api/http/namespaces/sql.py +33 -25
- mindsdb/api/http/namespaces/tab.py +27 -37
- mindsdb/api/http/namespaces/views.py +1 -1
- mindsdb/api/http/start.py +16 -10
- mindsdb/api/mcp/__init__.py +2 -1
- mindsdb/api/mysql/mysql_proxy/executor/mysql_executor.py +15 -20
- mindsdb/api/mysql/mysql_proxy/mysql_proxy.py +26 -50
- mindsdb/api/mysql/mysql_proxy/utilities/__init__.py +0 -1
- mindsdb/api/mysql/mysql_proxy/utilities/dump.py +8 -2
- mindsdb/integrations/handlers/byom_handler/byom_handler.py +165 -190
- mindsdb/integrations/handlers/databricks_handler/databricks_handler.py +98 -46
- mindsdb/integrations/handlers/druid_handler/druid_handler.py +32 -40
- mindsdb/integrations/handlers/file_handler/file_handler.py +7 -0
- mindsdb/integrations/handlers/gitlab_handler/gitlab_handler.py +5 -2
- mindsdb/integrations/handlers/lightwood_handler/functions.py +45 -79
- mindsdb/integrations/handlers/mssql_handler/mssql_handler.py +438 -100
- mindsdb/integrations/handlers/mssql_handler/requirements_odbc.txt +3 -0
- mindsdb/integrations/handlers/mysql_handler/mysql_handler.py +235 -3
- mindsdb/integrations/handlers/oracle_handler/__init__.py +2 -0
- mindsdb/integrations/handlers/oracle_handler/connection_args.py +7 -1
- mindsdb/integrations/handlers/oracle_handler/oracle_handler.py +321 -16
- mindsdb/integrations/handlers/oracle_handler/requirements.txt +1 -1
- mindsdb/integrations/handlers/postgres_handler/postgres_handler.py +14 -2
- mindsdb/integrations/handlers/shopify_handler/requirements.txt +1 -0
- mindsdb/integrations/handlers/shopify_handler/shopify_handler.py +80 -13
- mindsdb/integrations/handlers/snowflake_handler/snowflake_handler.py +2 -1
- mindsdb/integrations/handlers/statsforecast_handler/requirements.txt +1 -0
- mindsdb/integrations/handlers/statsforecast_handler/requirements_extra.txt +1 -0
- mindsdb/integrations/handlers/web_handler/urlcrawl_helpers.py +4 -4
- mindsdb/integrations/handlers/zendesk_handler/zendesk_tables.py +144 -111
- mindsdb/integrations/libs/api_handler.py +10 -10
- mindsdb/integrations/libs/base.py +4 -4
- mindsdb/integrations/libs/llm/utils.py +2 -2
- mindsdb/integrations/libs/ml_handler_process/create_engine_process.py +4 -7
- mindsdb/integrations/libs/ml_handler_process/func_call_process.py +2 -7
- mindsdb/integrations/libs/ml_handler_process/learn_process.py +37 -47
- mindsdb/integrations/libs/ml_handler_process/update_engine_process.py +4 -7
- mindsdb/integrations/libs/ml_handler_process/update_process.py +2 -7
- mindsdb/integrations/libs/process_cache.py +132 -140
- mindsdb/integrations/libs/response.py +18 -12
- mindsdb/integrations/libs/vectordatabase_handler.py +26 -0
- mindsdb/integrations/utilities/files/file_reader.py +6 -7
- mindsdb/integrations/utilities/handlers/auth_utilities/snowflake/__init__.py +1 -0
- mindsdb/integrations/utilities/handlers/auth_utilities/snowflake/snowflake_jwt_gen.py +151 -0
- mindsdb/integrations/utilities/rag/config_loader.py +37 -26
- mindsdb/integrations/utilities/rag/rerankers/base_reranker.py +83 -30
- mindsdb/integrations/utilities/rag/rerankers/reranker_compressor.py +4 -4
- mindsdb/integrations/utilities/rag/retrievers/sql_retriever.py +55 -133
- mindsdb/integrations/utilities/rag/settings.py +58 -133
- mindsdb/integrations/utilities/rag/splitters/file_splitter.py +5 -15
- mindsdb/interfaces/agents/agents_controller.py +2 -3
- mindsdb/interfaces/agents/constants.py +0 -2
- mindsdb/interfaces/agents/litellm_server.py +34 -58
- mindsdb/interfaces/agents/mcp_client_agent.py +10 -10
- mindsdb/interfaces/agents/mindsdb_database_agent.py +5 -5
- mindsdb/interfaces/agents/run_mcp_agent.py +12 -21
- mindsdb/interfaces/chatbot/chatbot_task.py +20 -23
- mindsdb/interfaces/chatbot/polling.py +30 -18
- mindsdb/interfaces/data_catalog/data_catalog_loader.py +16 -17
- mindsdb/interfaces/data_catalog/data_catalog_reader.py +15 -4
- mindsdb/interfaces/database/data_handlers_cache.py +190 -0
- mindsdb/interfaces/database/database.py +3 -3
- mindsdb/interfaces/database/integrations.py +7 -110
- mindsdb/interfaces/database/projects.py +2 -6
- mindsdb/interfaces/database/views.py +1 -4
- mindsdb/interfaces/file/file_controller.py +6 -6
- mindsdb/interfaces/functions/controller.py +1 -1
- mindsdb/interfaces/functions/to_markdown.py +2 -2
- mindsdb/interfaces/jobs/jobs_controller.py +5 -9
- mindsdb/interfaces/jobs/scheduler.py +3 -9
- mindsdb/interfaces/knowledge_base/controller.py +244 -128
- mindsdb/interfaces/knowledge_base/evaluate.py +36 -41
- mindsdb/interfaces/knowledge_base/executor.py +11 -0
- mindsdb/interfaces/knowledge_base/llm_client.py +51 -17
- mindsdb/interfaces/knowledge_base/preprocessing/json_chunker.py +40 -61
- mindsdb/interfaces/model/model_controller.py +172 -168
- mindsdb/interfaces/query_context/context_controller.py +14 -2
- mindsdb/interfaces/skills/custom/text2sql/mindsdb_sql_toolkit.py +10 -14
- mindsdb/interfaces/skills/retrieval_tool.py +43 -50
- mindsdb/interfaces/skills/skill_tool.py +2 -2
- mindsdb/interfaces/skills/skills_controller.py +1 -4
- mindsdb/interfaces/skills/sql_agent.py +25 -19
- mindsdb/interfaces/storage/db.py +16 -6
- mindsdb/interfaces/storage/fs.py +114 -169
- mindsdb/interfaces/storage/json.py +19 -18
- mindsdb/interfaces/tabs/tabs_controller.py +49 -72
- mindsdb/interfaces/tasks/task_monitor.py +3 -9
- mindsdb/interfaces/tasks/task_thread.py +7 -9
- mindsdb/interfaces/triggers/trigger_task.py +7 -13
- mindsdb/interfaces/triggers/triggers_controller.py +47 -52
- mindsdb/migrations/migrate.py +16 -16
- mindsdb/utilities/api_status.py +58 -0
- mindsdb/utilities/config.py +68 -2
- mindsdb/utilities/exception.py +40 -1
- mindsdb/utilities/fs.py +0 -1
- mindsdb/utilities/hooks/profiling.py +17 -14
- mindsdb/utilities/json_encoder.py +24 -10
- mindsdb/utilities/langfuse.py +40 -45
- mindsdb/utilities/log.py +272 -0
- mindsdb/utilities/ml_task_queue/consumer.py +52 -58
- mindsdb/utilities/ml_task_queue/producer.py +26 -30
- mindsdb/utilities/render/sqlalchemy_render.py +22 -20
- mindsdb/utilities/starters.py +0 -10
- mindsdb/utilities/utils.py +2 -2
- {mindsdb-25.9.2.0a1.dist-info → mindsdb-25.10.0.dist-info}/METADATA +286 -267
- {mindsdb-25.9.2.0a1.dist-info → mindsdb-25.10.0.dist-info}/RECORD +145 -159
- mindsdb/api/mysql/mysql_proxy/utilities/exceptions.py +0 -14
- mindsdb/api/postgres/__init__.py +0 -0
- mindsdb/api/postgres/postgres_proxy/__init__.py +0 -0
- mindsdb/api/postgres/postgres_proxy/executor/__init__.py +0 -1
- mindsdb/api/postgres/postgres_proxy/executor/executor.py +0 -189
- mindsdb/api/postgres/postgres_proxy/postgres_packets/__init__.py +0 -0
- mindsdb/api/postgres/postgres_proxy/postgres_packets/errors.py +0 -322
- mindsdb/api/postgres/postgres_proxy/postgres_packets/postgres_fields.py +0 -34
- mindsdb/api/postgres/postgres_proxy/postgres_packets/postgres_message.py +0 -31
- mindsdb/api/postgres/postgres_proxy/postgres_packets/postgres_message_formats.py +0 -1265
- mindsdb/api/postgres/postgres_proxy/postgres_packets/postgres_message_identifiers.py +0 -31
- mindsdb/api/postgres/postgres_proxy/postgres_packets/postgres_packets.py +0 -253
- mindsdb/api/postgres/postgres_proxy/postgres_proxy.py +0 -477
- mindsdb/api/postgres/postgres_proxy/utilities/__init__.py +0 -10
- mindsdb/api/postgres/start.py +0 -11
- mindsdb/integrations/handlers/mssql_handler/tests/__init__.py +0 -0
- mindsdb/integrations/handlers/mssql_handler/tests/test_mssql_handler.py +0 -169
- mindsdb/integrations/handlers/oracle_handler/tests/__init__.py +0 -0
- mindsdb/integrations/handlers/oracle_handler/tests/test_oracle_handler.py +0 -32
- {mindsdb-25.9.2.0a1.dist-info → mindsdb-25.10.0.dist-info}/WHEEL +0 -0
- {mindsdb-25.9.2.0a1.dist-info → mindsdb-25.10.0.dist-info}/licenses/LICENSE +0 -0
- {mindsdb-25.9.2.0a1.dist-info → mindsdb-25.10.0.dist-info}/top_level.txt +0 -0
mindsdb/integrations/utilities/rag/retrievers/sql_retriever.py

@@ -1,10 +1,10 @@
 import re
-
-from pydantic import BaseModel, Field
-from typing import List, Any, Optional, Dict, Tuple, Union, Callable
-import collections
 import math
+import logging
+import collections
+from typing import List, Any, Optional, Dict, Tuple, Union, Callable

+from pydantic import BaseModel, Field
 from langchain.chains.llm import LLMChain
 from langchain_core.callbacks.manager import CallbackManagerForRetrieverRun
 from langchain_core.documents.base import Document
@@ -39,9 +39,7 @@ class MetadataFilter(BaseModel):
     """Represents an LLM generated metadata filter to apply to a PostgreSQL query."""

     attribute: str = Field(description="Database column to apply filter to")
-    comparator: str = Field(
-        description="PostgreSQL comparator to use to filter database column"
-    )
+    comparator: str = Field(description="PostgreSQL comparator to use to filter database column")
     value: Any = Field(description="Value to use to filter database column")


@@ -56,9 +54,7 @@ class AblativeMetadataFilter(MetadataFilter):
 class MetadataFilters(BaseModel):
     """List of LLM generated metadata filters to apply to a PostgreSQL query."""

-    filters: List[MetadataFilter] = Field(
-        description="List of PostgreSQL metadata filters to apply for user query"
-    )
+    filters: List[MetadataFilter] = Field(description="List of PostgreSQL metadata filters to apply for user query")


 class SQLRetriever(BaseRetriever):
@@ -142,25 +138,17 @@ class SQLRetriever(BaseRetriever):
         elif isinstance(schema, ColumnSchema):
             collection_key = "values"
         else:
-            raise Exception(
-                "schema must be either a DatabaseSchema, TableSchema, or ColumnSchema."
-            )
+            raise Exception("schema must be either a DatabaseSchema, TableSchema, or ColumnSchema.")

         if update is not None:
-            ordered = collections.OrderedDict(
-                sorted(update.items(), key=key, reverse=True)
-            )
+            ordered = collections.OrderedDict(sorted(update.items(), key=key, reverse=True))
         else:
-            ordered = collections.OrderedDict(
-                sorted(getattr(schema, collection_key).items(), key=key, reverse=True)
-            )
+            ordered = collections.OrderedDict(sorted(getattr(schema, collection_key).items(), key=key, reverse=True))
         schema = schema.model_copy(update={collection_key: ordered})

         return schema

-    def _sort_database_schema_by_key(
-        self, database_schema: DatabaseSchema, key: Callable
-    ) -> DatabaseSchema:
+    def _sort_database_schema_by_key(self, database_schema: DatabaseSchema, key: Callable) -> DatabaseSchema:
         """Re-build schema with OrderedDicts"""
         tables = {}
         # build new tables dict
@@ -169,17 +157,11 @@ class SQLRetriever(BaseRetriever):
             # build new column dict
             for column_key, column_schema in table_schema.columns.items():
                 # sort values directly and update column schema
-                columns[column_key] = self._sort_schema_by_key(
-                    schema=column_schema, key=key
-                )
+                columns[column_key] = self._sort_schema_by_key(schema=column_schema, key=key)
             # update table schema and sort
-            tables[table_key] = self._sort_schema_by_key(
-                schema=table_schema, key=key, update=columns
-            )
+            tables[table_key] = self._sort_schema_by_key(schema=table_schema, key=key, update=columns)
         # update table schema and sort
-        database_schema = self._sort_schema_by_key(
-            schema=database_schema, key=key, update=tables
-        )
+        database_schema = self._sort_schema_by_key(schema=database_schema, key=key, update=tables)

         return database_schema

@@ -191,15 +173,12 @@ class SQLRetriever(BaseRetriever):
         boolean_system_prompt: bool = True,
         format_instructions: Optional[str] = None,
     ) -> ChatPromptTemplate:
-
         if boolean_system_prompt is True:
             system_prompt = self.boolean_system_prompt
         else:
             system_prompt = self.generative_system_prompt

-        prepared_column_prompt = self._prepare_column_prompt(
-            column_schema=column_schema, table_schema=table_schema
-        )
+        prepared_column_prompt = self._prepare_column_prompt(column_schema=column_schema, table_schema=table_schema)
         column_schema_str = (
             prepared_column_prompt.messages[1]
             .format(
@@ -290,7 +269,6 @@ Below is a list of comparison operators for constructing filters for this value
         table_schema: TableSchema,
         boolean_system_prompt: bool = True,
     ) -> ChatPromptTemplate:
-
         if boolean_system_prompt is True:
             system_prompt = self.boolean_system_prompt
         else:
@@ -312,9 +290,7 @@ Below is a list of comparison operators for constructing filters for this value
             [("system", system_prompt), ("user", self.column_prompt_template)]
         )

-        header_str = (
-            f"This schema describes a column in the {table_schema.table} table."
-        )
+        header_str = f"This schema describes a column in the {table_schema.table} table."

         value_str = """
 ## **Content**
@@ -388,26 +364,18 @@ Below is a description of the contents in this column in list format:
         )

     def _rank_schema(self, prompt: ChatPromptTemplate, query: str) -> float:
-        rank_chain = LLMChain(
-            llm=self.llm.bind(logprobs=True), prompt=prompt, return_final_only=False
-        )
+        rank_chain = LLMChain(llm=self.llm.bind(logprobs=True), prompt=prompt, return_final_only=False)
         output = rank_chain({"query": query})  # returns metadata

         # parse through metadata tokens until encountering either yes, or no.
         score = None  # a None score indicates the model output could not be parsed.
-        for content in output["full_generation"][0].message.response_metadata[
-            "logprobs"
-        ]["content"]:
+        for content in output["full_generation"][0].message.response_metadata["logprobs"]["content"]:
             # Convert answer to score using the model's confidence
             if content["token"].lower().strip() == "yes":
-                score = (
-                    1 + math.exp(content["logprob"])
-                ) / 2  # If yes, use the model's confidence
+                score = (1 + math.exp(content["logprob"])) / 2  # If yes, use the model's confidence
                 break
             elif content["token"].lower().strip() == "no":
-                score = (
-                    1 - math.exp(content["logprob"])
-                ) / 2  # If no, invert the confidence
+                score = (1 - math.exp(content["logprob"])) / 2  # If no, invert the confidence
                 break

         if score is None:
@@ -465,9 +433,7 @@ Below is a description of the contents in this column in list format:
                     table_schema=table_schema,
                     boolean_system_prompt=True,
                 )
-                column_schema.relevance = self._rank_schema(
-                    prompt=prompt, query=query
-                )
+                column_schema.relevance = self._rank_schema(prompt=prompt, query=query)

                 columns[column_key] = column_schema

@@ -512,9 +478,7 @@ Below is a description of the contents in this column in list format:
                     table_schema=table_schema,
                     boolean_system_prompt=True,
                 )
-                value_schema.relevance = self._rank_schema(
-                    prompt=prompt, query=query
-                )
+                value_schema.relevance = self._rank_schema(prompt=prompt, query=query)

                 values[value_key] = value_schema

@@ -592,19 +556,13 @@ Below is a description of the contents in this column in list format:
         for table_key, table_schema in ordered_database_schema.tables.items():
             for column_key, column_schema in table_schema.columns.items():
                 for value_key, value_schema in column_schema.values.items():
-                    ablation_value_dict[(table_key, column_key, value_key)] = (
-                        value_schema.relevance
-                    )
+                    ablation_value_dict[(table_key, column_key, value_key)] = value_schema.relevance

-        ablation_value_dict = collections.OrderedDict(
-            sorted(ablation_value_dict.items(), key=lambda x: x[1])
-        )
+        ablation_value_dict = collections.OrderedDict(sorted(ablation_value_dict.items(), key=lambda x: x[1]))

         relevance_scores = list(ablation_value_dict.values())
         if len(relevance_scores) > 0:
-            ablation_quantiles = np.quantile(
-                relevance_scores, np.linspace(0, 1, self.num_retries + 2)[1:-1]
-            )
+            ablation_quantiles = np.quantile(relevance_scores, np.linspace(0, 1, self.num_retries + 2)[1:-1])
         else:
             ablation_quantiles = None

@@ -628,11 +586,7 @@ Below is a description of the contents in this column in list format:
         ablated_filters = []
         for filter in metadata_filters:
             for key in ablated_dict.keys():
-                if (
-                    filter.schema_table in key
-                    and filter.schema_column in key
-                    and filter.schema_value in key
-                ):
+                if filter.schema_table in key and filter.schema_column in key and filter.schema_value in key:
                     ablated_filters.append(filter)

         return ablated_filters
@@ -646,9 +600,7 @@ Below is a description of the contents in this column in list format:
         pass

     def _prepare_retrieval_query(self, query: str) -> str:
-        rewrite_prompt = PromptTemplate(
-            input_variables=["input"], template=self.rewrite_prompt_template
-        )
+        rewrite_prompt = PromptTemplate(input_variables=["input"], template=self.rewrite_prompt_template)
         rewrite_chain = LLMChain(llm=self.llm, prompt=rewrite_prompt)
         return rewrite_chain.predict(input=query)

@@ -668,9 +620,7 @@ Below is a description of the contents in this column in list format:
         # Add Table JOIN statements
         join_clauses = set()
         for metadata_filter in metadata_filters:
-            join_clause = ranked_database_schema.tables[
-                metadata_filter.schema_table
-            ].join
+            join_clause = ranked_database_schema.tables[metadata_filter.schema_table].join
             if join_clause in join_clauses:
                 continue
             else:
@@ -688,12 +638,12 @@ Below is a description of the contents in this column in list format:
             if i < len(metadata_filters) - 1:
                 base_query += " AND "

-        base_query += f" ORDER BY e.embeddings {self.distance_function.value[0]} '{{embeddings}}' LIMIT {self.search_kwargs.k};"
+        base_query += (
+            f" ORDER BY e.embeddings {self.distance_function.value[0]} '{{embeddings}}' LIMIT {self.search_kwargs.k};"
+        )
         return base_query

-    def _generate_filter(
-        self, prompt: ChatPromptTemplate, query: str
-    ) -> MetadataFilter:
+    def _generate_filter(self, prompt: ChatPromptTemplate, query: str) -> MetadataFilter:
         gen_filter_chain = LLMChain(llm=self.llm, prompt=prompt)
         output = gen_filter_chain({"query": query})
         return output
@@ -714,28 +664,22 @@ Below is a description of the contents in this column in list format:
                 # must use generation if field is a dictionary of tuples or a list
                 if type(value_schema.value) in [list, dict]:
                     try:
-                        metadata_prompt: ChatPromptTemplate = (
-                            self._prepare_value_prompt(
-                                format_instructions=parser.get_format_instructions(),
-                                value_schema=value_schema,
-                                column_schema=column_schema,
-                                table_schema=table_schema,
-                                boolean_system_prompt=False,
-                            )
+                        metadata_prompt: ChatPromptTemplate = self._prepare_value_prompt(
+                            format_instructions=parser.get_format_instructions(),
+                            value_schema=value_schema,
+                            column_schema=column_schema,
+                            table_schema=table_schema,
+                            boolean_system_prompt=False,
                         )

-                        metadata_filters_chain = LLMChain(
-                            llm=self.llm, prompt=metadata_prompt
-                        )
+                        metadata_filters_chain = LLMChain(llm=self.llm, prompt=metadata_prompt)
                         metadata_filter_output = metadata_filters_chain.predict(
                             query=query,
                         )

                         # If the LLM outputs raw JSON, use it as-is.
                         # If the LLM outputs anything including a json markdown section, use the last one.
-                        json_markdown_output = re.findall(
-                            r"```json.*```", metadata_filter_output, re.DOTALL
-                        )
+                        json_markdown_output = re.findall(r"```json.*```", metadata_filter_output, re.DOTALL)
                         if json_markdown_output:
                             metadata_filter_output = json_markdown_output[-1]
                             # Clean the json tags.
@@ -754,11 +698,10 @@ Below is a description of the contents in this column in list format:
                         metadata_filter = AblativeMetadataFilter(**model_dump)
                     except OutputParserException as e:
                         logger.warning(
-                            f"LLM failed to generate structured metadata filters: {e}"
-                        )
-                        return HandlerResponse(
-                            RESPONSE_TYPE.ERROR, error_message=str(e)
+                            f"LLM failed to generate structured metadata filters: {e}",
+                            exc_info=logger.isEnabledFor(logging.DEBUG),
                         )
+                        return HandlerResponse(RESPONSE_TYPE.ERROR, error_message=str(e))
                     else:
                         metadata_filter = AblativeMetadataFilter(
                             attribute=column_schema.column,
@@ -779,24 +722,17 @@ Below is a description of the contents in this column in list format:
         embeddings_str: str,
     ) -> HandlerResponse:
         try:
-            checked_sql_query = self._prepare_pgvector_query(
-                ranked_database_schema, metadata_filters
-            )
-            checked_sql_query_with_embeddings = checked_sql_query.format(
-                embeddings=embeddings_str
-            )
-            return self.vector_store_handler.native_query(
-                checked_sql_query_with_embeddings
-            )
+            checked_sql_query = self._prepare_pgvector_query(ranked_database_schema, metadata_filters)
+            checked_sql_query_with_embeddings = checked_sql_query.format(embeddings=embeddings_str)
+            return self.vector_store_handler.native_query(checked_sql_query_with_embeddings)
         except Exception as e:
             logger.warning(
-                f"Failed to prepare and execute SQL query from structured metadata: {e}"
+                f"Failed to prepare and execute SQL query from structured metadata: {e}",
+                exc_info=logger.isEnabledFor(logging.DEBUG),
             )
             return HandlerResponse(RESPONSE_TYPE.ERROR, error_message=str(e))

-    def _get_relevant_documents(
-        self, query: str, *, run_manager: CallbackManagerForRetrieverRun
-    ) -> List[Document]:
+    def _get_relevant_documents(self, query: str, *, run_manager: CallbackManagerForRetrieverRun) -> List[Document]:
         # Rewrite query to be suitable for retrieval.
         retrieval_query = self._prepare_retrieval_query(query)

@@ -804,14 +740,10 @@ Below is a description of the contents in this column in list format:
         embedded_query = self.embeddings_model.embed_query(retrieval_query)

         # Search for relevant filters
-        ranked_database_schema, ablation_value_dict, ablation_quantiles = (
-            self._breadth_first_search(query=query)
-        )
+        ranked_database_schema, ablation_value_dict, ablation_quantiles = self._breadth_first_search(query=query)

         # Generate metadata filters
-        metadata_filters = self._generate_metadata_filters(
-            query=query, ranked_database_schema=ranked_database_schema
-        )
+        metadata_filters = self._generate_metadata_filters(query=query, ranked_database_schema=ranked_database_schema)

         if type(metadata_filters) is list:
             # Initial Execution of the similarity search with metadata filters.
@@ -830,9 +762,7 @@ Below is a description of the contents in this column in list format:
                     break
                 elif document_response.resp_type == RESPONSE_TYPE.ERROR:
                     # LLMs won't always generate structured metadata so we should have a fallback after retrying.
-                    logger.info(
-                        f"SQL Retriever query failed with error {document_response.error_message}"
-                    )
+                    logger.info(f"SQL Retriever query failed with error {document_response.error_message}")
                 else:
                     logger.info(
                         f"SQL Retriever did not retrieve {self.min_k} documents: {len(document_response.data_frame)} documents retrieved."
@@ -867,17 +797,9 @@ Below is a description of the contents in this column in list format:
                 return retrieved_documents

             # If the SQL query constructed did not return any documents, fallback.
-            logger.info(
-                "No documents returned from SQL retriever, using fallback retriever."
-            )
-            return self.fallback_retriever._get_relevant_documents(
-                retrieval_query, run_manager=run_manager
-            )
+            logger.info("No documents returned from SQL retriever, using fallback retriever.")
+            return self.fallback_retriever._get_relevant_documents(retrieval_query, run_manager=run_manager)
         else:
             # If no metadata fields could be generated fallback.
-            logger.info(
-                "No metadata fields were successfully generated, using fallback retriever."
-            )
-            return self.fallback_retriever._get_relevant_documents(
-                retrieval_query, run_manager=run_manager
-            )
+            logger.info("No metadata fields were successfully generated, using fallback retriever.")
+            return self.fallback_retriever._get_relevant_documents(retrieval_query, run_manager=run_manager)
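Aside from joining statements that previously spanned multiple lines, the recurring substantive change in these hunks is that warning logs now attach the exception traceback only when debug logging is enabled, via `exc_info=logger.isEnabledFor(logging.DEBUG)`. A minimal, self-contained sketch of that pattern; the `risky_call` helper is hypothetical and not part of MindsDB:

```python
import logging

logger = logging.getLogger(__name__)


def risky_call():
    # Hypothetical stand-in for preparing/executing the pgvector query.
    raise ValueError("could not build pgvector query")


try:
    risky_call()
except Exception as e:
    # Same pattern as the diff: the message is always logged at WARNING,
    # but the full traceback (exc_info=True) is included only when the
    # logger is configured at DEBUG level or lower.
    logger.warning(
        f"Failed to prepare and execute SQL query from structured metadata: {e}",
        exc_info=logger.isEnabledFor(logging.DEBUG),
    )
```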