PyPI - MindsDB - Versions diffs - 25.7.2.0__py3-none-any.whl → 25.7.4.0__py3-none-any.whl - Mend

MindsDB 25.7.2.0__py3-none-any.whl → 25.7.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of MindsDB might be problematic. Click here for more details.

Files changed (69)

mindsdb/__about__.py +1 -1
mindsdb/__main__.py +1 -1
mindsdb/api/a2a/common/server/server.py +16 -6
mindsdb/api/executor/command_executor.py +213 -137
mindsdb/api/executor/datahub/datanodes/integration_datanode.py +5 -1
mindsdb/api/executor/datahub/datanodes/project_datanode.py +14 -3
mindsdb/api/executor/planner/plan_join.py +3 -0
mindsdb/api/executor/planner/plan_join_ts.py +117 -100
mindsdb/api/executor/planner/query_planner.py +1 -0
mindsdb/api/executor/sql_query/steps/apply_predictor_step.py +54 -85
mindsdb/api/http/initialize.py +16 -43
mindsdb/api/http/namespaces/agents.py +24 -21
mindsdb/api/http/namespaces/chatbots.py +83 -120
mindsdb/api/http/namespaces/file.py +1 -1
mindsdb/api/http/namespaces/jobs.py +38 -60
mindsdb/api/http/namespaces/tree.py +69 -61
mindsdb/api/mcp/start.py +2 -0
mindsdb/api/mysql/mysql_proxy/utilities/dump.py +3 -2
mindsdb/integrations/handlers/autogluon_handler/requirements.txt +1 -1
mindsdb/integrations/handlers/autosklearn_handler/requirements.txt +1 -1
mindsdb/integrations/handlers/bigquery_handler/bigquery_handler.py +25 -5
mindsdb/integrations/handlers/chromadb_handler/chromadb_handler.py +3 -3
mindsdb/integrations/handlers/flaml_handler/requirements.txt +1 -1
mindsdb/integrations/handlers/google_calendar_handler/google_calendar_tables.py +82 -73
mindsdb/integrations/handlers/hubspot_handler/requirements.txt +1 -1
mindsdb/integrations/handlers/langchain_handler/langchain_handler.py +83 -76
mindsdb/integrations/handlers/lightwood_handler/requirements.txt +4 -4
mindsdb/integrations/handlers/litellm_handler/litellm_handler.py +16 -3
mindsdb/integrations/handlers/litellm_handler/settings.py +2 -1
mindsdb/integrations/handlers/llama_index_handler/requirements.txt +1 -1
mindsdb/integrations/handlers/pgvector_handler/pgvector_handler.py +106 -90
mindsdb/integrations/handlers/postgres_handler/postgres_handler.py +41 -39
mindsdb/integrations/handlers/s3_handler/s3_handler.py +72 -70
mindsdb/integrations/handlers/salesforce_handler/constants.py +208 -0
mindsdb/integrations/handlers/salesforce_handler/salesforce_handler.py +142 -81
mindsdb/integrations/handlers/salesforce_handler/salesforce_tables.py +12 -4
mindsdb/integrations/handlers/slack_handler/slack_tables.py +141 -161
mindsdb/integrations/handlers/tpot_handler/requirements.txt +1 -1
mindsdb/integrations/handlers/web_handler/urlcrawl_helpers.py +32 -17
mindsdb/integrations/handlers/web_handler/web_handler.py +19 -22
mindsdb/integrations/handlers/youtube_handler/youtube_tables.py +183 -55
mindsdb/integrations/libs/vectordatabase_handler.py +10 -1
mindsdb/integrations/utilities/handler_utils.py +32 -12
mindsdb/interfaces/agents/agents_controller.py +169 -110
mindsdb/interfaces/agents/langchain_agent.py +10 -3
mindsdb/interfaces/data_catalog/data_catalog_loader.py +22 -8
mindsdb/interfaces/database/database.py +38 -13
mindsdb/interfaces/database/integrations.py +20 -5
mindsdb/interfaces/database/projects.py +63 -16
mindsdb/interfaces/database/views.py +86 -60
mindsdb/interfaces/jobs/jobs_controller.py +103 -110
mindsdb/interfaces/knowledge_base/controller.py +33 -5
mindsdb/interfaces/knowledge_base/evaluate.py +53 -9
mindsdb/interfaces/knowledge_base/executor.py +24 -0
mindsdb/interfaces/knowledge_base/llm_client.py +3 -3
mindsdb/interfaces/knowledge_base/preprocessing/document_preprocessor.py +21 -13
mindsdb/interfaces/query_context/context_controller.py +100 -133
mindsdb/interfaces/skills/skills_controller.py +18 -6
mindsdb/interfaces/storage/db.py +40 -6
mindsdb/interfaces/variables/variables_controller.py +8 -15
mindsdb/utilities/config.py +3 -3
mindsdb/utilities/functions.py +72 -60
mindsdb/utilities/log.py +38 -6
mindsdb/utilities/ps.py +7 -7
{mindsdb-25.7.2.0.dist-info → mindsdb-25.7.4.0.dist-info}/METADATA +262 -263
{mindsdb-25.7.2.0.dist-info → mindsdb-25.7.4.0.dist-info}/RECORD +69 -68
{mindsdb-25.7.2.0.dist-info → mindsdb-25.7.4.0.dist-info}/WHEEL +0 -0
{mindsdb-25.7.2.0.dist-info → mindsdb-25.7.4.0.dist-info}/licenses/LICENSE +0 -0
{mindsdb-25.7.2.0.dist-info → mindsdb-25.7.4.0.dist-info}/top_level.txt +0 -0

mindsdb/integrations/handlers/salesforce_handler/salesforce_handler.py CHANGED Viewed

@@ -11,6 +11,7 @@ from mindsdb.integrations.libs.response import (
     RESPONSE_TYPE,
 )
 from mindsdb.integrations.handlers.salesforce_handler.salesforce_tables import create_table_class
+from mindsdb.integrations.handlers.salesforce_handler.constants import get_soql_instructions
 from mindsdb.utilities import log
@@ -72,7 +73,7 @@ class SalesforceHandler(MetaAPIHandler):
             resource_tables = self._get_resource_names()
             for resource_name in resource_tables:
-                table_class = create_table_class(resource_name)
+                table_class = create_table_class(resource_name.lower())
                 self._register_table(resource_name, table_class(self))
             return self.connection
@@ -156,91 +157,152 @@ class SalesforceHandler(MetaAPIHandler):
     def _get_resource_names(self) -> List[str]:
         """
-        Retrieves the names of the Salesforce resources, with more aggressive filtering to remove tables.
+        Retrieves the names of the Salesforce resources with optimized pre-filtering.
         Returns:
             List[str]: A list of filtered resource names.
         """
         if not self.resource_names:
-            all_resources = [
-                resource["name"]
-                for resource in self.connection.sobjects.describe()["sobjects"]
-                if resource.get("queryable", False)
-            ]
+            # Check for user-specified table filtering first
+            include_tables = self.connection_data.get("include_tables") or self.connection_data.get("tables")
+            exclude_tables = self.connection_data.get("exclude_tables", [])
+            if include_tables:
+                # OPTIMIZATION: Skip expensive global describe() call
+                # Only validate the specified tables
+                logger.info(f"Using pre-filtered table list: {include_tables}")
+                self.resource_names = self._validate_specified_tables(include_tables, exclude_tables)
+            else:
+                # Fallback to full discovery with hard-coded filtering
+                logger.info("No table filter specified, performing full discovery...")
+                self.resource_names = self._discover_all_tables_with_filtering(exclude_tables)
-            # Define patterns for tables to be filtered out.
-            # Expanded suffixes and prefixes and exact matches
-            ignore_suffixes = ("Share", "History", "Feed", "ChangeEvent", "Tag", "Permission", "Setup", "Consent")
-            ignore_prefixes = (
-                "Apex",
-                "CommPlatform",
-                "Lightning",
-                "Flow",
-                "Transaction",
-                "AI",
-                "Aura",
-                "ContentWorkspace",
-                "Collaboration",
-                "Datacloud",
-            )
-            ignore_exact = {
-                "EntityDefinition",
-                "FieldDefinition",
-                "RecordType",
-                "CaseStatus",
-                "UserRole",
-                "UserLicense",
-                "UserPermissionAccess",
-                "UserRecordAccess",
-                "Folder",
-                "Group",
-                "Note",
-                "ProcessDefinition",
-                "ProcessInstance",
-                "ContentFolder",
-                "ContentDocumentSubscription",
-                "DashboardComponent",
-                "Report",
-                "Dashboard",
-                "Topic",
-                "TopicAssignment",
-                "Period",
-                "Partner",
-                "PackageLicense",
-                "ColorDefinition",
-                "DataUsePurpose",
-                "DataUseLegalBasis",
-            }
-            ignore_substrings = (
-                "CleanInfo",
-                "Template",
-                "Rule",
-                "Definition",
-                "Status",
-                "Policy",
-                "Setting",
-                "Access",
-                "Config",
-                "Subscription",
-                "DataType",
-                "MilestoneType",
-                "Entitlement",
-                "Auth",
-            )
-            filtered = []
-            for r in all_resources:
-                if (
-                    not r.endswith(ignore_suffixes)
-                    and not r.startswith(ignore_prefixes)
-                    and not any(sub in r for sub in ignore_substrings)
-                    and r not in ignore_exact
-                ):
-                    filtered.append(r)
-            self.resource_names = [r for r in filtered]
         return self.resource_names
+    def _validate_specified_tables(self, include_tables: List[str], exclude_tables: List[str]) -> List[str]:
+        """
+        Validate user-specified tables without expensive global describe() call.
+        Args:
+            include_tables: List of table names to include
+            exclude_tables: List of table names to exclude
+        Returns:
+            List[str]: Validated and filtered table names
+        """
+        validated_tables = []
+        for table_name in include_tables:
+            # Skip if explicitly excluded
+            if table_name in exclude_tables:
+                logger.info(f"Skipping excluded table: {table_name}")
+                continue
+            try:
+                # Quick validation: check if table exists and is queryable
+                # This is much faster than global describe()
+                metadata = getattr(self.connection.sobjects, table_name).describe()
+                if metadata.get("queryable", False):
+                    validated_tables.append(table_name)
+                    logger.debug(f"Validated table: {table_name}")
+                else:
+                    logger.warning(f"Table {table_name} is not queryable, skipping")
+            except Exception as e:
+                logger.warning(f"Table {table_name} not found or accessible: {e}")
+        logger.info(f"Validated {len(validated_tables)} tables from include_tables")
+        return validated_tables
+    def _discover_all_tables_with_filtering(self, exclude_tables: List[str]) -> List[str]:
+        """
+        Fallback method: discover all tables with hard-coded filtering.
+        Args:
+            exclude_tables: List of table names to exclude
+        Returns:
+            List[str]: Filtered table names
+        """
+        # This is the original expensive approach - only used when no include_tables specified
+        all_resources = [
+            resource["name"]
+            for resource in self.connection.sobjects.describe()["sobjects"]
+            if resource.get("queryable", False)
+        ]
+        # Apply hard-coded filtering (existing logic)
+        ignore_suffixes = ("Share", "History", "Feed", "ChangeEvent", "Tag", "Permission", "Setup", "Consent")
+        ignore_prefixes = (
+            "Apex",
+            "CommPlatform",
+            "Lightning",
+            "Flow",
+            "Transaction",
+            "AI",
+            "Aura",
+            "ContentWorkspace",
+            "Collaboration",
+            "Datacloud",
+        )
+        ignore_exact = {
+            "EntityDefinition",
+            "FieldDefinition",
+            "RecordType",
+            "CaseStatus",
+            "UserRole",
+            "UserLicense",
+            "UserPermissionAccess",
+            "UserRecordAccess",
+            "Folder",
+            "Group",
+            "Note",
+            "ProcessDefinition",
+            "ProcessInstance",
+            "ContentFolder",
+            "ContentDocumentSubscription",
+            "DashboardComponent",
+            "Report",
+            "Dashboard",
+            "Topic",
+            "TopicAssignment",
+            "Period",
+            "Partner",
+            "PackageLicense",
+            "ColorDefinition",
+            "DataUsePurpose",
+            "DataUseLegalBasis",
+        }
+        ignore_substrings = (
+            "CleanInfo",
+            "Template",
+            "Rule",
+            "Definition",
+            "Status",
+            "Policy",
+            "Setting",
+            "Access",
+            "Config",
+            "Subscription",
+            "DataType",
+            "MilestoneType",
+            "Entitlement",
+            "Auth",
+        )
+        # Apply hard-coded filtering
+        filtered = []
+        for r in all_resources:
+            if (
+                not r.endswith(ignore_suffixes)
+                and not r.startswith(ignore_prefixes)
+                and not any(sub in r for sub in ignore_substrings)
+                and r not in ignore_exact
+                and r not in exclude_tables  # Apply user exclusions
+            ):
+                filtered.append(r)
+        return filtered
     def meta_get_handler_info(self, **kwargs) -> str:
         """
         Retrieves information about the design and implementation of the API handler.
@@ -254,8 +316,7 @@ class SalesforceHandler(MetaAPIHandler):
         Returns:
             str: A string containing information about the API handler's design and implementation.
         """
-        # TODO: Relationships? Aliases?
-        return "When filtering on a Date or DateTime field, the value MUST be an unquoted literal in YYYY-MM-DD or YYYY-MM-DDThh:mm:ssZ format. For example, CloseDate >= 2025-05-28 is correct; CloseDate >= '2025-05-28' is incorrect."
+        return get_soql_instructions(self.name)
     def meta_get_tables(self, table_names: Optional[List[str]] = None) -> Response:
         """

mindsdb/integrations/handlers/salesforce_handler/salesforce_tables.py CHANGED Viewed

@@ -164,10 +164,18 @@ def create_table_class(resource_name: Text) -> MetaAPIResource:
             """
             client = self.handler.connect()
-            resource_metadata = next(
-                (resource for resource in main_metadata if resource["name"].lower() == resource_name),
-            )
+            try:
+                resource_metadata = next(
+                    (resource for resource in main_metadata if resource["name"].lower() == resource_name),
+                )
+            except Exception as e:
+                logger.warning(f"Failed to get resource metadata for {resource_name}: {e}")
+                return {
+                    "table_name": table_name,
+                    "table_type": "BASE TABLE",
+                    "table_description": "",
+                    "row_count": None,
+                }
             # Get row count if Id column is aggregatable.
             row_count = None
             # if next(field for field in resource_metadata['fields'] if field['name'] == 'Id').get('aggregatable', False):

MindsDB 25.7.2.0__py3-none-any.whl → 25.7.4.0__py3-none-any.whl

Potentially problematic release.

MindsDB 25.7.2.0__py3-none-any.whl → 25.7.4.0__py3-none-any.whl