MindsDB 25.5.4.2__py3-none-any.whl → 25.6.3.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of MindsDB might be problematic.
- mindsdb/__about__.py +1 -1
- mindsdb/api/a2a/agent.py +50 -26
- mindsdb/api/a2a/common/server/server.py +32 -26
- mindsdb/api/a2a/task_manager.py +68 -6
- mindsdb/api/executor/command_executor.py +69 -14
- mindsdb/api/executor/datahub/datanodes/integration_datanode.py +49 -65
- mindsdb/api/executor/datahub/datanodes/mindsdb_tables.py +91 -84
- mindsdb/api/executor/datahub/datanodes/project_datanode.py +29 -48
- mindsdb/api/executor/datahub/datanodes/system_tables.py +35 -61
- mindsdb/api/executor/planner/plan_join.py +67 -77
- mindsdb/api/executor/planner/query_planner.py +176 -155
- mindsdb/api/executor/planner/steps.py +37 -12
- mindsdb/api/executor/sql_query/result_set.py +45 -64
- mindsdb/api/executor/sql_query/steps/fetch_dataframe.py +14 -18
- mindsdb/api/executor/sql_query/steps/fetch_dataframe_partition.py +17 -18
- mindsdb/api/executor/sql_query/steps/insert_step.py +13 -33
- mindsdb/api/executor/sql_query/steps/subselect_step.py +43 -35
- mindsdb/api/executor/utilities/sql.py +42 -48
- mindsdb/api/http/namespaces/config.py +1 -1
- mindsdb/api/http/namespaces/file.py +14 -23
- mindsdb/api/http/namespaces/knowledge_bases.py +132 -154
- mindsdb/api/mysql/mysql_proxy/data_types/mysql_datum.py +12 -28
- mindsdb/api/mysql/mysql_proxy/data_types/mysql_packets/binary_resultset_row_package.py +59 -50
- mindsdb/api/mysql/mysql_proxy/data_types/mysql_packets/resultset_row_package.py +9 -8
- mindsdb/api/mysql/mysql_proxy/libs/constants/mysql.py +449 -461
- mindsdb/api/mysql/mysql_proxy/utilities/dump.py +87 -36
- mindsdb/integrations/handlers/bigquery_handler/bigquery_handler.py +219 -28
- mindsdb/integrations/handlers/file_handler/file_handler.py +15 -9
- mindsdb/integrations/handlers/file_handler/tests/test_file_handler.py +43 -24
- mindsdb/integrations/handlers/litellm_handler/litellm_handler.py +10 -3
- mindsdb/integrations/handlers/llama_index_handler/requirements.txt +1 -1
- mindsdb/integrations/handlers/mysql_handler/mysql_handler.py +29 -33
- mindsdb/integrations/handlers/openai_handler/openai_handler.py +277 -356
- mindsdb/integrations/handlers/oracle_handler/oracle_handler.py +74 -51
- mindsdb/integrations/handlers/postgres_handler/postgres_handler.py +305 -98
- mindsdb/integrations/handlers/salesforce_handler/salesforce_handler.py +145 -40
- mindsdb/integrations/handlers/salesforce_handler/salesforce_tables.py +136 -6
- mindsdb/integrations/handlers/snowflake_handler/snowflake_handler.py +352 -83
- mindsdb/integrations/libs/api_handler.py +279 -57
- mindsdb/integrations/libs/base.py +185 -30
- mindsdb/integrations/utilities/files/file_reader.py +99 -73
- mindsdb/integrations/utilities/handler_utils.py +23 -8
- mindsdb/integrations/utilities/sql_utils.py +35 -40
- mindsdb/interfaces/agents/agents_controller.py +226 -196
- mindsdb/interfaces/agents/constants.py +8 -1
- mindsdb/interfaces/agents/langchain_agent.py +42 -11
- mindsdb/interfaces/agents/mcp_client_agent.py +29 -21
- mindsdb/interfaces/agents/mindsdb_database_agent.py +23 -18
- mindsdb/interfaces/data_catalog/__init__.py +0 -0
- mindsdb/interfaces/data_catalog/base_data_catalog.py +54 -0
- mindsdb/interfaces/data_catalog/data_catalog_loader.py +375 -0
- mindsdb/interfaces/data_catalog/data_catalog_reader.py +38 -0
- mindsdb/interfaces/database/database.py +81 -57
- mindsdb/interfaces/database/integrations.py +222 -234
- mindsdb/interfaces/database/log.py +72 -104
- mindsdb/interfaces/database/projects.py +156 -193
- mindsdb/interfaces/file/file_controller.py +21 -65
- mindsdb/interfaces/knowledge_base/controller.py +66 -25
- mindsdb/interfaces/knowledge_base/evaluate.py +516 -0
- mindsdb/interfaces/knowledge_base/llm_client.py +75 -0
- mindsdb/interfaces/skills/custom/text2sql/mindsdb_kb_tools.py +83 -43
- mindsdb/interfaces/skills/skills_controller.py +31 -36
- mindsdb/interfaces/skills/sql_agent.py +113 -86
- mindsdb/interfaces/storage/db.py +242 -82
- mindsdb/migrations/versions/2025-05-28_a44643042fe8_added_data_catalog_tables.py +118 -0
- mindsdb/migrations/versions/2025-06-09_608e376c19a7_updated_data_catalog_data_types.py +58 -0
- mindsdb/utilities/config.py +13 -2
- mindsdb/utilities/log.py +35 -26
- mindsdb/utilities/ml_task_queue/task.py +19 -22
- mindsdb/utilities/render/sqlalchemy_render.py +129 -181
- mindsdb/utilities/starters.py +40 -0
- {mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/METADATA +257 -257
- {mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/RECORD +76 -68
- {mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/WHEEL +0 -0
- {mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/licenses/LICENSE +0 -0
- {mindsdb-25.5.4.2.dist-info → mindsdb-25.6.3.0.dist-info}/top_level.txt +0 -0
mindsdb/integrations/handlers/file_handler/tests/test_file_handler.py

@@ -7,12 +7,22 @@ from pathlib import Path
 import pandas
 import pytest
 from mindsdb_sql_parser.exceptions import ParsingException
-from mindsdb_sql_parser.ast import …
+from mindsdb_sql_parser.ast import (
+    CreateTable,
+    DropTables,
+    Identifier,
+    Insert,
+    TableColumn,
+    Update,
+)
 
 from mindsdb.integrations.handlers.file_handler.file_handler import FileHandler
 from mindsdb.integrations.libs.response import RESPONSE_TYPE
 
-from mindsdb.integrations.utilities.files.file_reader import …
+from mindsdb.integrations.utilities.files.file_reader import (
+    FileReader,
+    FileProcessingError,
+)
 
 
 # Define a table to use as content for all of the file types
@@ -103,21 +113,18 @@ class TestIsItX:
 
     def test_is_it_csv(self):
         # We can't test xlsx or parquet here because they're binary files
-        for file_path, result in (
-            (csv_file(), True),
-            (json_file(), False)
-        ):
+        for file_path, result in ((csv_file(), True), (json_file(), False)):
             with open(file_path, "r") as fh:
                 assert FileReader.is_csv(StringIO(fh.read())) is result
 
     def test_format(self):
         for file_path, result in (
-            (csv_file(), …
-            (xlsx_file(), …
-            (json_file(), …
-            (parquet_file(), …
-            (txt_file(), …
-            (pdf_file(), …
+            (csv_file(), "csv"),
+            (xlsx_file(), "xlsx"),
+            (json_file(), "json"),
+            (parquet_file(), "parquet"),
+            (txt_file(), "txt"),
+            (pdf_file(), "pdf"),
         ):
             assert FileReader(path=file_path).get_format() == result
 
@@ -182,6 +189,7 @@ class TestQuery:
 
         def mock_get_file_path(self, name):
             return csv_tmp
+
         monkeypatch.setattr(MockFileController, "get_file_path", mock_get_file_path)
 
         file_handler = FileHandler(file_controller=MockFileController())
@@ -255,14 +263,13 @@ class TestQuery:
 
 
 def test_handle_source():
-
     def get_reader(file_path):
         # using path
         reader = FileReader(path=file_path)
         yield reader
 
         # using file descriptor
-        with open(file_path, …
+        with open(file_path, "rb") as fd:
             reader = FileReader(file=fd)
             yield reader
             fd.seek(0)
@@ -310,14 +317,31 @@ def test_check_valid_dialects(csv_string, delimiter):
 def test_tsv():
     file = BytesIO(b"example;csv;file\tname")
 
-    reader = FileReader(file=file, name=…
-    assert reader.get_format() == …
-    assert reader.parameters[…
+    reader = FileReader(file=file, name="test.tsv")
+    assert reader.get_format() == "csv"
+    assert reader.parameters["delimiter"] == "\t"
 
     df = reader.get_page_content()
     assert len(df.columns) == 2
 
 
+def test_bad_csv_header():
+    file = BytesIO(b" a,b ,c\n1,2,3\n")
+    reader = FileReader(file=file, name="test.tsv")
+    df = reader.get_page_content()
+    assert set(df.columns) == set(["a", "b", "c"])
+
+    wrong_data = [
+        b"a, ,c\n1,2,3\n",
+        b"a, \t,c\n1,2,3\n",
+        b" ,b,c\n1,2,3\n",
+    ]
+    for data in wrong_data:
+        reader = FileReader(file=BytesIO(data), name="test.tsv")
+        with pytest.raises(FileProcessingError):
+            df = reader.get_page_content()
+
+
 def test_check_invalid_dialects():
     with pytest.raises(Exception):
         FileHandler._get_csv_dialect("example csv file")
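The new test_tsv and test_bad_csv_header cases pin down two FileReader behaviours: a .tsv-named file is parsed as CSV with a sniffed tab delimiter, and blank or whitespace-only header cells raise FileProcessingError. The sketch below re-implements both checks in isolation to show the idea; it is a hypothetical illustration with made-up helper names, not MindsDB's FileReader code:

# Hypothetical sketch of the two behaviours exercised above: guessing a
# delimiter from candidate characters and rejecting blank header cells.
# Illustrative only, not MindsDB's FileReader implementation.


class FileProcessingError(Exception):
    """Stand-in for the FileProcessingError imported in the tests above."""


def guess_delimiter(text: str, candidates: str = ",;\t") -> str:
    # Pick the candidate that appears a consistent, non-zero number of times per line.
    lines = [line for line in text.splitlines() if line]
    for candidate in candidates:
        counts = {line.count(candidate) for line in lines}
        if len(counts) == 1 and counts.pop() > 0:
            return candidate
    return ","


def read_header(raw: bytes) -> list[str]:
    text = raw.decode()
    header = [cell.strip() for cell in text.splitlines()[0].split(guess_delimiter(text))]
    if any(cell == "" for cell in header):
        raise FileProcessingError("blank column name in header")
    return header


print(read_header(b"example;csv;file\tname\nvalue1\tvalue2\n"))  # tab wins: 2 columns
print(read_header(b" a,b ,c\n1,2,3\n"))                          # stripped to ['a', 'b', 'c']
try:
    read_header(b"a, ,c\n1,2,3\n")
except FileProcessingError as exc:
    print("rejected:", exc)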
@@ -334,10 +358,7 @@ def test_get_tables():
     assert response.type == RESPONSE_TYPE.TABLE
 
     expected_df = pandas.DataFrame(
-        [
-            {"TABLE_NAME": x[0], "TABLE_ROWS": x[1], "TABLE_TYPE": "BASE TABLE"}
-            for x in file_records
-        ]
+        [{"TABLE_NAME": x[0], "TABLE_ROWS": x[1], "TABLE_TYPE": "BASE TABLE"} for x in file_records]
     )
 
     assert response.data_frame.equals(expected_df)
@@ -349,8 +370,6 @@ def test_get_columns():
 
     assert response.type == RESPONSE_TYPE.TABLE
 
-    expected_df = pandas.DataFrame(
-        [{"Field": x, "Type": "str"} for x in file_records[0][2]]
-    )
+    expected_df = pandas.DataFrame([{"Field": x, "Type": "str"} for x in file_records[0][2]])
 
     assert response.data_frame.equals(expected_df)
mindsdb/integrations/handlers/litellm_handler/litellm_handler.py

@@ -2,7 +2,7 @@ import ast
 from typing import Dict, Optional, List
 
 
-from litellm import completion, batch_completion, embedding
+from litellm import completion, batch_completion, embedding, acompletion
 import pandas as pd
 
 from mindsdb.integrations.libs.base import BaseMLEngine
@@ -42,10 +42,17 @@ class LiteLLMHandler(BaseMLEngine):
                 f"https://{args['snowflake_account_id']}.snowflakecomputing.com/api/v2/cortex/inference:complete"
             )
 
-        from litellm import acompletion
-
         return await acompletion(model=model, messages=messages, stream=False, **args)
 
+    @staticmethod
+    def completion(model: str, messages: List[dict], args: dict):
+        if model.startswith("snowflake/") and "snowflake_account_id" in args:
+            args["api_base"] = (
+                f"https://{args['snowflake_account_id']}.snowflakecomputing.com/api/v2/cortex/inference:complete"
+            )
+
+        return completion(model=model, messages=messages, stream=False, **args)
+
     def create(
         self,
         target: str,
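The added static completion helper is the synchronous twin of acompletion above: for snowflake/-prefixed models it points litellm at the account's Cortex inference endpoint via api_base, then delegates to litellm.completion. A hedged usage sketch; the model name, account id and credentials are placeholders, not values from the diff:

# Hedged usage sketch of the static helper added above; model, account id and
# credentials are placeholders. litellm returns an OpenAI-style response object.
from mindsdb.integrations.handlers.litellm_handler.litellm_handler import LiteLLMHandler

args = {
    "snowflake_account_id": "my-account",  # placeholder account identifier
    "api_key": "...",                      # provider credentials passed through to litellm
}
messages = [{"role": "user", "content": "Summarise this table in one sentence."}]

# api_base becomes https://my-account.snowflakecomputing.com/api/v2/cortex/inference:complete
response = LiteLLMHandler.completion(model="snowflake/mistral-large", messages=messages, args=args)
print(response.choices[0].message.content)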
mindsdb/integrations/handlers/mysql_handler/mysql_handler.py

@@ -31,9 +31,7 @@ def _map_type(mysql_type_text: str) -> MYSQL_DATA_TYPE:
     try:
         return MYSQL_DATA_TYPE(mysql_type_text.upper())
     except Exception:
-        logger.warning(
-            f"MySQL handler: unknown type: {mysql_type_text}, use TEXT as fallback."
-        )
+        logger.warning(f"MySQL handler: unknown type: {mysql_type_text}, use TEXT as fallback.")
         return MYSQL_DATA_TYPE.TEXT
 
 
@@ -65,22 +63,23 @@ def _make_table_response(result: list[dict], cursor: mysql.connector.cursor.MySQ…
             mysql_types.append(reverse_c_type_map[type_int])
             continue
 
-        if type_int …
-        …
+        if type_int == C_TYPES.MYSQL_TYPE_BLOB:
+            # region determine text/blob type by flags
+            # Unfortunately, there is no way to determine particular type of text/blob column by flags.
+            # Subtype have to be determined by 8-s element of description tuple, but mysql.conector
+            # return the same value for all text types (TINYTEXT, TEXT, MEDIUMTEXT, LONGTEXT), and for
+            # all blob types (TINYBLOB, BLOB, MEDIUMBLOB, LONGBLOB).
+            if col[7] == 16:  # and col[8] == 45
+                mysql_types.append(MYSQL_DATA_TYPE.TEXT)
+            elif col[7] == 144:  # and col[8] == 63
+                mysql_types.append(MYSQL_DATA_TYPE.BLOB)
+            else:
+                logger.debug(f"MySQL handler: unknown type code {col[7]}, use TEXT as fallback.")
+                mysql_types.append(MYSQL_DATA_TYPE.TEXT)
+            # endregion
         else:
-            logger.…
+            logger.warning(f"MySQL handler: unknown type id={type_int} in column {col[0]}, use TEXT as fallback.")
             mysql_types.append(MYSQL_DATA_TYPE.TEXT)
-        # endregion
 
     # region cast int and bool to nullable types
     serieses = []
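Note on the hunk above: BLOB-typed columns are disambiguated purely from the flags value in the cursor description (16 for the TEXT family, 144 for the BLOB family), with TEXT as the fallback. A standalone sketch of that mapping, using a stand-in enum rather than MindsDB's MYSQL_DATA_TYPE:

# Minimal sketch of the TEXT/BLOB disambiguation shown above. The flag values
# 16 and 144 come from the diff; ColumnType is a stand-in for MYSQL_DATA_TYPE.
from enum import Enum


class ColumnType(Enum):
    TEXT = "text"
    BLOB = "blob"


def blob_column_type(flags: int) -> ColumnType:
    """Map the flags field of a MYSQL_TYPE_BLOB column description to TEXT or BLOB."""
    if flags == 16:    # observed for TINYTEXT / TEXT / MEDIUMTEXT / LONGTEXT
        return ColumnType.TEXT
    if flags == 144:   # observed for TINYBLOB / BLOB / MEDIUMBLOB / LONGBLOB
        return ColumnType.BLOB
    return ColumnType.TEXT  # unknown flag combination: fall back to TEXT


print(blob_column_type(16), blob_column_type(144), blob_column_type(0))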
@@ -88,22 +87,20 @@ def _make_table_response(result: list[dict], cursor: mysql.connector.cursor.MySQ…
         expected_dtype = None
         column_name = description[i][0]
         if mysql_type in (
-            MYSQL_DATA_TYPE.SMALLINT,
-            MYSQL_DATA_TYPE.…
+            MYSQL_DATA_TYPE.SMALLINT,
+            MYSQL_DATA_TYPE.INT,
+            MYSQL_DATA_TYPE.MEDIUMINT,
+            MYSQL_DATA_TYPE.BIGINT,
+            MYSQL_DATA_TYPE.TINYINT,
         ):
-            expected_dtype = …
+            expected_dtype = "Int64"
         elif mysql_type in (MYSQL_DATA_TYPE.BOOL, MYSQL_DATA_TYPE.BOOLEAN):
-            expected_dtype = …
+            expected_dtype = "boolean"
         serieses.append(pd.Series([row[column_name] for row in result], dtype=expected_dtype, name=description[i][0]))
     df = pd.concat(serieses, axis=1, copy=False)
     # endregion
 
-    response = Response(
-        RESPONSE_TYPE.TABLE,
-        df,
-        affected_rows=cursor.rowcount,
-        mysql_types=mysql_types
-    )
+    response = Response(RESPONSE_TYPE.TABLE, df, affected_rows=cursor.rowcount, mysql_types=mysql_types)
     return response
 
 
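The dtype choices in the hunk above matter because NumPy-backed columns cannot hold NULLs: an int64 column with a missing value silently becomes float64, and a bool column with None becomes object. Pandas' nullable "Int64" and "boolean" dtypes keep the declared type and mark missing values as pd.NA. A quick standalone illustration with plain pandas:

# Why the handler builds integer/boolean columns with pandas' nullable dtypes:
# with plain int64 a NULL forces the column to float64, while "Int64"/"boolean"
# keep the type and represent the missing value as pd.NA.
import pandas as pd

rows = [{"n": 1, "flag": True}, {"n": None, "flag": None}, {"n": 3, "flag": False}]

naive = pd.DataFrame(rows)
print(naive.dtypes)                 # n becomes float64, flag becomes object

n = pd.Series([r["n"] for r in rows], dtype="Int64", name="n")
flag = pd.Series([r["flag"] for r in rows], dtype="boolean", name="flag")
typed = pd.concat([n, flag], axis=1, copy=False)
print(typed.dtypes)                 # n: Int64, flag: boolean
print(typed["n"].isna().tolist())   # [False, True, False]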
@@ -182,6 +179,9 @@ class MySQLHandler(DatabaseHandler):
             config["ssl_cert"] = ssl_cert
             if ssl_key is not None:
                 config["ssl_key"] = ssl_key
+        elif ssl is False:
+            config["ssl_disabled"] = True
+
         if "collation" not in config:
             config["collation"] = "utf8mb4_general_ci"
         if "use_pure" not in config:
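The new elif branch maps an explicit ssl=False connection argument to mysql.connector's ssl_disabled option, so TLS is skipped instead of being negotiated implicitly. A hedged sketch of the resulting connection config; host, credentials and database are placeholders, not values from the diff:

# Hedged sketch of the config produced when ssl is False; host, user, password
# and database are placeholders, not values from the diff.
import mysql.connector

config = {
    "host": "127.0.0.1",
    "port": 3306,
    "user": "mindsdb",
    "password": "secret",
    "database": "example_db",
    "collation": "utf8mb4_general_ci",
    "ssl_disabled": True,   # what config["ssl_disabled"] = True produces above
}

connection = mysql.connector.connect(**config)
print(connection.is_connected())
connection.close()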
@@ -219,9 +219,7 @@ class MySQLHandler(DatabaseHandler):
             connection = self.connect()
             result.success = connection.is_connected()
         except mysql.connector.Error as e:
-            logger.error(
-                f'Error connecting to MySQL {self.connection_data["database"]}, {e}!'
-            )
+            logger.error(f"Error connecting to MySQL {self.connection_data['database']}, {e}!")
             result.error_message = str(e)
 
         if result.success and need_to_close:
@@ -252,9 +250,7 @@ class MySQLHandler(DatabaseHandler):
                 else:
                     response = Response(RESPONSE_TYPE.OK, affected_rows=cur.rowcount)
             except mysql.connector.Error as e:
-                logger.error(
-                    f'Error running query: {query} on {self.connection_data["database"]}!'
-                )
+                logger.error(f"Error running query: {query} on {self.connection_data['database']}!")
                 response = Response(RESPONSE_TYPE.ERROR, error_message=str(e))
                 if connection is not None and connection.is_connected():
                     connection.rollback()