PyPI - MindsDB - Versions diffs - 25.5.4.2__py3-none-any.whl → 25.6.3.0__py3-none-any.whl - Mend

MindsDB 25.5.4.2__py3-none-any.whl → 25.6.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of MindsDB might be problematic. Click here for more details.

Files changed (76) hide show

mindsdb/__about__.py +1 -1
mindsdb/api/a2a/agent.py +50 -26
mindsdb/api/a2a/common/server/server.py +32 -26
mindsdb/api/a2a/task_manager.py +68 -6
mindsdb/api/executor/command_executor.py +69 -14
mindsdb/api/executor/datahub/datanodes/integration_datanode.py +49 -65
mindsdb/api/executor/datahub/datanodes/mindsdb_tables.py +91 -84
mindsdb/api/executor/datahub/datanodes/project_datanode.py +29 -48
mindsdb/api/executor/datahub/datanodes/system_tables.py +35 -61
mindsdb/api/executor/planner/plan_join.py +67 -77
mindsdb/api/executor/planner/query_planner.py +176 -155
mindsdb/api/executor/planner/steps.py +37 -12
mindsdb/api/executor/sql_query/result_set.py +45 -64
mindsdb/api/executor/sql_query/steps/fetch_dataframe.py +14 -18
mindsdb/api/executor/sql_query/steps/fetch_dataframe_partition.py +17 -18
mindsdb/api/executor/sql_query/steps/insert_step.py +13 -33
mindsdb/api/executor/sql_query/steps/subselect_step.py +43 -35
mindsdb/api/executor/utilities/sql.py +42 -48
mindsdb/api/http/namespaces/config.py +1 -1
mindsdb/api/http/namespaces/file.py +14 -23
mindsdb/api/http/namespaces/knowledge_bases.py +132 -154
mindsdb/api/mysql/mysql_proxy/data_types/mysql_datum.py +12 -28
mindsdb/api/mysql/mysql_proxy/data_types/mysql_packets/binary_resultset_row_package.py +59 -50
mindsdb/api/mysql/mysql_proxy/data_types/mysql_packets/resultset_row_package.py +9 -8
mindsdb/api/mysql/mysql_proxy/libs/constants/mysql.py +449 -461
mindsdb/api/mysql/mysql_proxy/utilities/dump.py +87 -36
mindsdb/integrations/handlers/bigquery_handler/bigquery_handler.py +219 -28
mindsdb/integrations/handlers/file_handler/file_handler.py +15 -9
mindsdb/integrations/handlers/file_handler/tests/test_file_handler.py +43 -24
mindsdb/integrations/handlers/litellm_handler/litellm_handler.py +10 -3
mindsdb/integrations/handlers/llama_index_handler/requirements.txt +1 -1
mindsdb/integrations/handlers/mysql_handler/mysql_handler.py +29 -33
mindsdb/integrations/handlers/openai_handler/openai_handler.py +277 -356
mindsdb/integrations/handlers/oracle_handler/oracle_handler.py +74 -51
mindsdb/integrations/handlers/postgres_handler/postgres_handler.py +305 -98
mindsdb/integrations/handlers/salesforce_handler/salesforce_handler.py +145 -40
mindsdb/integrations/handlers/salesforce_handler/salesforce_tables.py +136 -6
mindsdb/integrations/handlers/snowflake_handler/snowflake_handler.py +352 -83
mindsdb/integrations/libs/api_handler.py +279 -57
mindsdb/integrations/libs/base.py +185 -30
mindsdb/integrations/utilities/files/file_reader.py +99 -73
mindsdb/integrations/utilities/handler_utils.py +23 -8
mindsdb/integrations/utilities/sql_utils.py +35 -40
mindsdb/interfaces/agents/agents_controller.py +226 -196
mindsdb/interfaces/agents/constants.py +8 -1
mindsdb/interfaces/agents/langchain_agent.py +42 -11
mindsdb/interfaces/agents/mcp_client_agent.py +29 -21
mindsdb/interfaces/agents/mindsdb_database_agent.py +23 -18
mindsdb/interfaces/data_catalog/__init__.py +0 -0
mindsdb/interfaces/data_catalog/base_data_catalog.py +54 -0
mindsdb/interfaces/data_catalog/data_catalog_loader.py +375 -0
mindsdb/interfaces/data_catalog/data_catalog_reader.py +38 -0
mindsdb/interfaces/database/database.py +81 -57
mindsdb/interfaces/database/integrations.py +222 -234
mindsdb/interfaces/database/log.py +72 -104
mindsdb/interfaces/database/projects.py +156 -193
mindsdb/interfaces/file/file_controller.py +21 -65
mindsdb/interfaces/knowledge_base/controller.py +66 -25
mindsdb/interfaces/knowledge_base/evaluate.py +516 -0
mindsdb/interfaces/knowledge_base/llm_client.py +75 -0
mindsdb/interfaces/skills/custom/text2sql/mindsdb_kb_tools.py +83 -43
mindsdb/interfaces/skills/skills_controller.py +31 -36
mindsdb/interfaces/skills/sql_agent.py +113 -86
mindsdb/interfaces/storage/db.py +242 -82
mindsdb/migrations/versions/2025-05-28_a44643042fe8_added_data_catalog_tables.py +118 -0
mindsdb/migrations/versions/2025-06-09_608e376c19a7_updated_data_catalog_data_types.py +58 -0
mindsdb/utilities/config.py +13 -2
mindsdb/utilities/log.py +35 -26
mindsdb/utilities/ml_task_queue/task.py +19 -22
mindsdb/utilities/render/sqlalchemy_render.py +129 -181
mindsdb/utilities/starters.py +40 -0
{mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/METADATA +257 -257
{mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/RECORD +76 -68
{mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/WHEEL +0 -0
{mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/licenses/LICENSE +0 -0
{mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/top_level.txt +0 -0

mindsdb/utilities/config.py CHANGED Viewed

@@ -217,6 +217,9 @@ class Config:
                 "project_name": "mindsdb",
                 "enabled": False,
             },
+            "data_catalog": {
+                "enabled": False,
+            },
         }
         # endregion
@@ -360,6 +363,8 @@ class Config:
             self._env_config["default_reranking_model"] = {
                 "api_key": os.environ["MINDSDB_DEFAULT_RERANKING_MODEL_API_KEY"]
             }
+        if os.environ.get("MINDSDB_DATA_CATALOG_ENABLED", "").lower() in ("1", "true"):
+            self._env_config["data_catalog"] = {"enabled": True}
         # region vars: a2a configuration
         a2a_config = {}
@@ -395,11 +400,17 @@ class Config:
             bool: True if config was loaded or updated
         """
-        if self.auto_config_mtime != self.auto_config_path.stat().st_mtime:
+        if (
+            self.auto_config_path.is_file()
+            and self.auto_config_path.read_text() != ""
+            and self.auto_config_mtime != self.auto_config_path.stat().st_mtime
+        ):
             try:
                 self._auto_config = json.loads(self.auto_config_path.read_text())
             except json.JSONDecodeError as e:
-                raise ValueError(f"The 'auto' configuration file ({self.auto_config_path}) contains invalid JSON: {e}")
+                raise ValueError(
+                    f"The 'auto' configuration file ({self.auto_config_path}) contains invalid JSON: {e}\nFile content: {self.auto_config_path.read_text()}"
+                )
             self.auto_config_mtime = self.auto_config_path.stat().st_mtime
             return True
         return False

mindsdb/utilities/log.py CHANGED Viewed

@@ -12,11 +12,11 @@ class JsonFormatter(logging.Formatter):
     def format(self, record):
         record_message = super().format(record)
         log_record = {
-            'process_name': record.processName,
-            'name': record.name,
-            'message': record_message,
-            'level': record.levelname,
-            'time': record.created
+            "process_name": record.processName,
+            "name": record.name,
+            "message": record_message,
+            "level": record.levelname,
+            "time": record.created,
         }
         return json.dumps(log_record)
@@ -44,12 +44,12 @@ class ColorFormatter(logging.Formatter):
 def get_console_handler_config_level() -> int:
-    console_handler_config = app_config['logging']['handlers']['console']
+    console_handler_config = app_config["logging"]["handlers"]["console"]
     return getattr(logging, console_handler_config["level"])
 def get_file_handler_config_level() -> int:
-    file_handler_config = app_config['logging']['handlers']['file']
+    file_handler_config = app_config["logging"]["handlers"]["file"]
     return getattr(logging, file_handler_config["level"])
@@ -60,27 +60,34 @@ def get_mindsdb_log_level() -> int:
     return min(console_handler_config_level, file_handler_config_level)
-def configure_logging():
+def configure_logging(process_name: str = None):
     handlers_config = {}
-    console_handler_config = app_config['logging']['handlers']['console']
+    console_handler_config = app_config["logging"]["handlers"]["console"]
     console_handler_config_level = getattr(logging, console_handler_config["level"])
-    if console_handler_config['enabled'] is True:
-        handlers_config['console'] = {
+    if console_handler_config["enabled"] is True:
+        handlers_config["console"] = {
             "class": "logging.StreamHandler",
-            "formatter": console_handler_config.get('formatter', 'default'),
-            "level": console_handler_config_level
+            "formatter": console_handler_config.get("formatter", "default"),
+            "level": console_handler_config_level,
         }
-    file_handler_config = app_config['logging']['handlers']['file']
+    file_handler_config = app_config["logging"]["handlers"]["file"]
     file_handler_config_level = getattr(logging, file_handler_config["level"])
-    if file_handler_config['enabled'] is True:
-        handlers_config['file'] = {
+    if file_handler_config["enabled"] is True:
+        file_name = file_handler_config["filename"]
+        if process_name is not None:
+            if "." in file_name:
+                parts = file_name.rpartition(".")
+                file_name = f"{parts[0]}_{process_name}.{parts[2]}"
+            else:
+                file_name = f"{file_name}_{process_name}"
+        handlers_config["file"] = {
             "class": "logging.handlers.RotatingFileHandler",
             "formatter": "file",
             "level": file_handler_config_level,
-            "filename": app_config.paths["log"] / file_handler_config["filename"],
+            "filename": app_config.paths["log"] / file_name,
             "maxBytes": file_handler_config["maxBytes"],  # 0.5 Mb
-            "backupCount": file_handler_config["backupCount"]
+            "backupCount": file_handler_config["backupCount"],
         }
     mindsdb_log_level = get_mindsdb_log_level()
@@ -90,9 +97,7 @@ def configure_logging():
         formatters={
             "default": {"()": ColorFormatter},
             "json": {"()": JsonFormatter},
-            "file": {
-                "format": "%(asctime)s %(processName)15s %(levelname)-8s %(name)s: %(message)s"
-            }
+            "file": {"format": "%(asctime)s %(processName)15s %(levelname)-8s %(name)s: %(message)s"},
         },
         handlers=handlers_config,
         loggers={
@@ -115,6 +120,14 @@ def configure_logging():
     dictConfig(logging_config)
+def initialize_logging(process_name: str = None) -> None:
+    """Initialyze logging"""
+    global logging_initialized
+    if not logging_initialized:
+        configure_logging(process_name)
+        logging_initialized = True
 # I would prefer to leave code to use logging.getLogger(), but there are a lot of complicated situations
 # in MindsDB with processes being spawned that require logging to be configured again in a lot of cases.
 # Using a custom logger-getter like this lets us do that logic here, once.
@@ -122,9 +135,5 @@ def getLogger(name=None):
     """
     Get a new logger, configuring logging first if it hasn't been done yet.
     """
-    global logging_initialized
-    if not logging_initialized:
-        configure_logging()
-        logging_initialized = True
+    initialize_logging()
     return logging.getLogger(name)

mindsdb/utilities/ml_task_queue/task.py CHANGED Viewed

@@ -8,14 +8,14 @@ from mindsdb.utilities.ml_task_queue.const import ML_TASK_STATUS
 class Task:
-    """ Abstraction for ML task. Should have interface similat to concurrent.futures.Future
+    """Abstraction for ML task. Should have interface similat to concurrent.futures.Future
-        Attributes:
-            db (Redis): database object
-            redis_key (RedisKey): redis keys associated with task
-            dataframe (DataFrame): task result
-            exception (Exception): task exeuton  runtime exception
-            _timeout (int): max time without status updating
+    Attributes:
+        db (Redis): database object
+        redis_key (RedisKey): redis keys associated with task
+        dataframe (DataFrame): task result
+        exception (Exception): task exeuton  runtime exception
+        _timeout (int): max time without status updating
     """
     def __init__(self, connection: redis.Redis, redis_key: RedisKey) -> None:
@@ -23,18 +23,17 @@ class Task:
         self.redis_key = redis_key
         self.dataframe = None
         self.exception = None
-        self._timeout = 30
+        self._timeout = 60
     def subscribe(self) -> ML_TASK_STATUS:
-        """ return tasks status untill it is not done or failed
-        """
+        """return tasks status untill it is not done or failed"""
         pubsub = self.db.pubsub()
         cache = self.db.cache()
         pubsub.subscribe(self.redis_key.status)
-        while (msg := pubsub.get_message(timeout=self._timeout)):
-            if msg['type'] not in pubsub.PUBLISH_MESSAGE_TYPES:
+        while msg := pubsub.get_message(timeout=self._timeout):
+            if msg["type"] not in pubsub.PUBLISH_MESSAGE_TYPES:
                 continue
-            ml_task_status = ML_TASK_STATUS(msg['data'])
+            ml_task_status = ML_TASK_STATUS(msg["data"])
             if ml_task_status == ML_TASK_STATUS.COMPLETE:
                 dataframe_bytes = cache.get(self.redis_key.dataframe)
                 if dataframe_bytes is not None:
@@ -51,8 +50,7 @@ class Task:
             yield ml_task_status
     def wait(self, status: ML_TASK_STATUS = ML_TASK_STATUS.COMPLETE) -> None:
-        """ block threasd untill task is not done or failed
-        """
+        """block threasd untill task is not done or failed"""
         for status in self.subscribe():
             if status in (ML_TASK_STATUS.WAITING, ML_TASK_STATUS.PROCESSING):
                 continue
@@ -60,23 +58,22 @@ class Task:
                 if self.exception is not None:
                     raise self.exception
                 else:
-                    raise Exception('Unknown error during ML task execution')
+                    raise Exception("Unknown error during ML task execution")
             if status == ML_TASK_STATUS.TIMEOUT:
                 raise Exception(f"Can't get answer in {self._timeout} seconds")
             if status == ML_TASK_STATUS.COMPLETE:
                 return
-            raise KeyError('Unknown task status')
+            raise KeyError("Unknown task status")
     def result(self) -> DataFrame:
-        """ wait task is done and return result
+        """wait task is done and return result
-            Returns:
-                DataFrame: task result
+        Returns:
+            DataFrame: task result
         """
         self.wait()
         return self.dataframe
     def add_done_callback(self, fn: Callable) -> None:
-        """ need for compatability with concurrent.futures.Future interface
-        """
+        """need for compatability with concurrent.futures.Future interface"""
         pass

MindsDB 25.5.4.2__py3-none-any.whl → 25.6.3.0__py3-none-any.whl

Potentially problematic release.

MindsDB 25.5.4.2__py3-none-any.whl → 25.6.3.0__py3-none-any.whl