sdg-hub 0.7.2__py3-none-any.whl → 0.8.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- sdg_hub/_version.py +2 -2
- sdg_hub/core/__init__.py +13 -1
- sdg_hub/core/blocks/__init__.py +11 -2
- sdg_hub/core/blocks/agent/__init__.py +6 -0
- sdg_hub/core/blocks/agent/agent_block.py +397 -0
- sdg_hub/core/blocks/base.py +4 -1
- sdg_hub/core/blocks/filtering/column_value_filter.py +2 -0
- sdg_hub/core/blocks/llm/__init__.py +3 -2
- sdg_hub/core/blocks/llm/llm_chat_block.py +2 -0
- sdg_hub/core/blocks/llm/{llm_parser_block.py → llm_response_extractor_block.py} +32 -9
- sdg_hub/core/blocks/llm/prompt_builder_block.py +2 -0
- sdg_hub/core/blocks/llm/text_parser_block.py +2 -0
- sdg_hub/core/blocks/transform/duplicate_columns.py +2 -0
- sdg_hub/core/blocks/transform/index_based_mapper.py +2 -0
- sdg_hub/core/blocks/transform/json_structure_block.py +2 -0
- sdg_hub/core/blocks/transform/melt_columns.py +2 -0
- sdg_hub/core/blocks/transform/rename_columns.py +12 -0
- sdg_hub/core/blocks/transform/text_concat.py +2 -0
- sdg_hub/core/blocks/transform/uniform_col_val_setter.py +2 -0
- sdg_hub/core/connectors/__init__.py +46 -0
- sdg_hub/core/connectors/agent/__init__.py +10 -0
- sdg_hub/core/connectors/agent/base.py +233 -0
- sdg_hub/core/connectors/agent/langflow.py +151 -0
- sdg_hub/core/connectors/base.py +99 -0
- sdg_hub/core/connectors/exceptions.py +41 -0
- sdg_hub/core/connectors/http/__init__.py +6 -0
- sdg_hub/core/connectors/http/client.py +150 -0
- sdg_hub/core/connectors/registry.py +112 -0
- sdg_hub/core/flow/base.py +7 -31
- sdg_hub/core/utils/flow_metrics.py +3 -3
- sdg_hub/flows/evaluation/rag/flow.yaml +6 -6
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/detailed_summary/flow.yaml +4 -4
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/doc_direct_qa/flow.yaml +3 -3
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/extractive_summary/flow.yaml +4 -4
- sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/flow.yaml +2 -2
- sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/flow.yaml +7 -7
- sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/multilingual/japanese/flow.yaml +7 -7
- sdg_hub/flows/text_analysis/structured_insights/flow.yaml +4 -4
- {sdg_hub-0.7.2.dist-info → sdg_hub-0.8.0.dist-info}/METADATA +2 -2
- {sdg_hub-0.7.2.dist-info → sdg_hub-0.8.0.dist-info}/RECORD +43 -32
- {sdg_hub-0.7.2.dist-info → sdg_hub-0.8.0.dist-info}/WHEEL +1 -1
- {sdg_hub-0.7.2.dist-info → sdg_hub-0.8.0.dist-info}/licenses/LICENSE +0 -0
- {sdg_hub-0.7.2.dist-info → sdg_hub-0.8.0.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,150 @@
|
|
|
1
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
2
|
+
"""HTTP client with tenacity retry."""
|
|
3
|
+
|
|
4
|
+
from typing import Any, Optional
|
|
5
|
+
|
|
6
|
+
from tenacity import (
|
|
7
|
+
retry,
|
|
8
|
+
retry_if_exception_type,
|
|
9
|
+
stop_after_attempt,
|
|
10
|
+
wait_exponential,
|
|
11
|
+
)
|
|
12
|
+
import httpx
|
|
13
|
+
|
|
14
|
+
from ...utils.logger_config import setup_logger
|
|
15
|
+
from ..exceptions import ConnectorError, ConnectorHTTPError
|
|
16
|
+
|
|
17
|
+
logger = setup_logger(__name__)
|
|
18
|
+
|
|
19
|
+
|
|
20
|
+
class HttpClient:
    """HTTP client with tenacity retry.

    Parameters
    ----------
    timeout : float
        Request timeout in seconds. Default is 120.0.
    max_retries : int
        Maximum number of retry attempts. Default is 3.

    Example
    -------
    >>> client = HttpClient(timeout=60.0, max_retries=3)
    >>> response = await client.post("https://api.example.com", {"key": "value"}, {})
    """

    def __init__(self, timeout: float = 120.0, max_retries: int = 3):
        self.timeout = timeout
        self.max_retries = max_retries

    def _retry_decorator(self):
        """Build the shared tenacity retry decorator.

        Centralizes the retry policy so the async and sync request paths
        cannot drift apart: 1 initial attempt + ``max_retries`` retries,
        exponential backoff clamped to [1s, 60s], retrying only on
        transient network failures (timeouts and connection errors).
        HTTP error statuses are NOT retried; they surface immediately.
        """
        return retry(
            stop=stop_after_attempt(self.max_retries + 1),  # 1 initial + retries
            wait=wait_exponential(multiplier=1, min=1, max=60),
            retry=retry_if_exception_type((httpx.TimeoutException, httpx.ConnectError)),
            reraise=True,
        )

    async def post(
        self,
        url: str,
        payload: dict[str, Any],
        headers: Optional[dict[str, str]] = None,
    ) -> dict[str, Any]:
        """Async POST request with retry logic.

        Parameters
        ----------
        url : str
            The URL to POST to.
        payload : dict
            The JSON payload to send.
        headers : dict, optional
            HTTP headers to include.

        Returns
        -------
        dict
            The JSON response.

        Raises
        ------
        ConnectorError
            If connection or timeout fails after all retries.
        ConnectorHTTPError
            If an HTTP error status is returned.
        """
        headers = headers or {}

        @self._retry_decorator()
        async def _post_with_retry() -> dict[str, Any]:
            async with httpx.AsyncClient(timeout=self.timeout) as client:
                logger.debug(f"POST request to {url}")
                response = await client.post(url, json=payload, headers=headers)
                response.raise_for_status()
                return response.json()

        try:
            return await _post_with_retry()
        except httpx.HTTPStatusError as e:
            # Truncate body to keep error messages bounded.
            response_text = e.response.text[:500] if e.response.text else None
            raise ConnectorHTTPError(url, e.response.status_code, response_text) from e
        except httpx.TimeoutException as e:
            raise ConnectorError(
                f"Request to '{url}' timed out after {self.timeout}s"
            ) from e
        except httpx.ConnectError as e:
            raise ConnectorError(f"Failed to connect to '{url}': {e}") from e

    def post_sync(
        self,
        url: str,
        payload: dict[str, Any],
        headers: Optional[dict[str, str]] = None,
    ) -> dict[str, Any]:
        """Synchronous POST request with retry logic.

        Parameters
        ----------
        url : str
            The URL to POST to.
        payload : dict
            The JSON payload to send.
        headers : dict, optional
            HTTP headers to include.

        Returns
        -------
        dict
            The JSON response.

        Raises
        ------
        ConnectorError
            If connection or timeout fails after all retries.
        ConnectorHTTPError
            If an HTTP error status is returned.
        """
        headers = headers or {}

        @self._retry_decorator()
        def _post_with_retry() -> dict[str, Any]:
            with httpx.Client(timeout=self.timeout) as client:
                logger.debug(f"POST request to {url}")
                response = client.post(url, json=payload, headers=headers)
                response.raise_for_status()
                return response.json()

        try:
            return _post_with_retry()
        except httpx.HTTPStatusError as e:
            # Truncate body to keep error messages bounded.
            response_text = e.response.text[:500] if e.response.text else None
            raise ConnectorHTTPError(url, e.response.status_code, response_text) from e
        except httpx.TimeoutException as e:
            raise ConnectorError(
                f"Request to '{url}' timed out after {self.timeout}s"
            ) from e
        except httpx.ConnectError as e:
            raise ConnectorError(f"Failed to connect to '{url}': {e}") from e
|
|
@@ -0,0 +1,112 @@
|
|
|
1
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
2
|
+
"""Registry for connector classes."""
|
|
3
|
+
|
|
4
|
+
import inspect
|
|
5
|
+
|
|
6
|
+
from ..utils.logger_config import setup_logger
|
|
7
|
+
from .exceptions import ConnectorError
|
|
8
|
+
|
|
9
|
+
logger = setup_logger(__name__)
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
class ConnectorRegistry:
    """Global registry for connector classes.

    Simple registry for registering and retrieving connectors by name.

    Example
    -------
    >>> @ConnectorRegistry.register("my_connector")
    ... class MyConnector(BaseConnector):
    ...     pass
    ...
    >>> connector_class = ConnectorRegistry.get("my_connector")
    """

    # Maps registered name -> connector class. Shared across the process.
    _connectors: dict[str, type] = {}

    @classmethod
    def register(cls, name: str):
        """Register a connector class.

        Parameters
        ----------
        name : str
            Name under which to register the connector.

        Returns
        -------
        callable
            Decorator function that registers the class.

        Raises
        ------
        ConnectorError
            If the decorated object is not a class or does not inherit
            from BaseConnector.

        Example
        -------
        >>> @ConnectorRegistry.register("langflow")
        ... class LangflowConnector(BaseAgentConnector):
        ...     pass
        """

        def decorator(connector_class: type) -> type:
            # Validate the class
            if not inspect.isclass(connector_class):
                raise ConnectorError(f"Expected a class, got {type(connector_class)}")

            # Imported lazily to avoid a circular import with .base
            from .base import BaseConnector

            if not issubclass(connector_class, BaseConnector):
                raise ConnectorError(
                    f"Connector class '{connector_class.__name__}' "
                    "must inherit from BaseConnector"
                )

            # Re-registering a name is almost always an accidental
            # collision; warn instead of overwriting silently.
            if name in cls._connectors:
                logger.warning(
                    f"Overwriting existing connector registration '{name}': "
                    f"{cls._connectors[name].__name__} -> {connector_class.__name__}"
                )

            cls._connectors[name] = connector_class
            logger.debug(f"Registered connector '{name}' ({connector_class.__name__})")

            return connector_class

        return decorator

    @classmethod
    def get(cls, name: str) -> type:
        """Get a connector class by name.

        Parameters
        ----------
        name : str
            Name of the connector to retrieve.

        Returns
        -------
        type
            The connector class.

        Raises
        ------
        ConnectorError
            If the connector is not found.
        """
        if name not in cls._connectors:
            available = sorted(cls._connectors.keys())
            error_msg = f"Connector '{name}' not found."
            if available:
                error_msg += f" Available: {', '.join(available)}"
            raise ConnectorError(error_msg)

        return cls._connectors[name]

    @classmethod
    def list_all(cls) -> list[str]:
        """Get all registered connector names.

        Returns
        -------
        list[str]
            Sorted list of all connector names.
        """
        return sorted(cls._connectors.keys())

    @classmethod
    def clear(cls) -> None:
        """Clear all registered connectors. Primarily for testing."""
        cls._connectors.clear()
|
sdg_hub/core/flow/base.py
CHANGED
|
@@ -679,7 +679,7 @@ class Flow(BaseModel):
|
|
|
679
679
|
self._block_metrics.append(
|
|
680
680
|
{
|
|
681
681
|
"block_name": block.block_name,
|
|
682
|
-
"
|
|
682
|
+
"block_class": block.__class__.__name__,
|
|
683
683
|
"execution_time": execution_time,
|
|
684
684
|
"input_rows": input_rows,
|
|
685
685
|
"output_rows": output_rows,
|
|
@@ -701,7 +701,7 @@ class Flow(BaseModel):
|
|
|
701
701
|
self._block_metrics.append(
|
|
702
702
|
{
|
|
703
703
|
"block_name": block.block_name,
|
|
704
|
-
"
|
|
704
|
+
"block_class": block.__class__.__name__,
|
|
705
705
|
"execution_time": execution_time,
|
|
706
706
|
"input_rows": input_rows,
|
|
707
707
|
"output_rows": 0,
|
|
@@ -882,38 +882,14 @@ class Flow(BaseModel):
|
|
|
882
882
|
)
|
|
883
883
|
|
|
884
884
|
def _detect_llm_blocks(self) -> list[str]:
|
|
885
|
-
"""Detect
|
|
886
|
-
|
|
887
|
-
LLM blocks are identified by having model, api_base, or api_key attributes,
|
|
888
|
-
regardless of their values (they may be None until set_model_config() is called).
|
|
885
|
+
"""Detect blocks with block_type='llm'.
|
|
889
886
|
|
|
890
887
|
Returns
|
|
891
888
|
-------
|
|
892
889
|
List[str]
|
|
893
|
-
List of block names that
|
|
890
|
+
List of block names that are LLM blocks.
|
|
894
891
|
"""
|
|
895
|
-
|
|
896
|
-
|
|
897
|
-
for block in self.blocks:
|
|
898
|
-
block_type = block.__class__.__name__
|
|
899
|
-
block_name = block.block_name
|
|
900
|
-
|
|
901
|
-
# Check by attribute existence (not value) - LLM blocks have these attributes even if None
|
|
902
|
-
has_model_attr = hasattr(block, "model")
|
|
903
|
-
has_api_base_attr = hasattr(block, "api_base")
|
|
904
|
-
has_api_key_attr = hasattr(block, "api_key")
|
|
905
|
-
|
|
906
|
-
# A block is considered an LLM block if it has any LLM-related attributes
|
|
907
|
-
is_llm_block = has_model_attr or has_api_base_attr or has_api_key_attr
|
|
908
|
-
|
|
909
|
-
if is_llm_block:
|
|
910
|
-
llm_blocks.append(block_name)
|
|
911
|
-
logger.debug(
|
|
912
|
-
f"Detected LLM block '{block_name}' ({block_type}): "
|
|
913
|
-
f"has_model_attr={has_model_attr}, has_api_base_attr={has_api_base_attr}, has_api_key_attr={has_api_key_attr}"
|
|
914
|
-
)
|
|
915
|
-
|
|
916
|
-
return llm_blocks
|
|
892
|
+
return [block.block_name for block in self.blocks if block.block_type == "llm"]
|
|
917
893
|
|
|
918
894
|
def is_model_config_required(self) -> bool:
|
|
919
895
|
"""Check if model configuration is required for this flow.
|
|
@@ -1152,7 +1128,7 @@ class Flow(BaseModel):
|
|
|
1152
1128
|
# Record block execution info
|
|
1153
1129
|
block_info = {
|
|
1154
1130
|
"block_name": block.block_name,
|
|
1155
|
-
"
|
|
1131
|
+
"block_class": block.__class__.__name__,
|
|
1156
1132
|
"execution_time_seconds": block_execution_time,
|
|
1157
1133
|
"input_rows": input_rows,
|
|
1158
1134
|
"output_rows": len(current_dataset),
|
|
@@ -1341,7 +1317,7 @@ class Flow(BaseModel):
|
|
|
1341
1317
|
"metadata": self.metadata.model_dump(),
|
|
1342
1318
|
"blocks": [
|
|
1343
1319
|
{
|
|
1344
|
-
"
|
|
1320
|
+
"block_class": block.__class__.__name__,
|
|
1345
1321
|
"block_name": block.block_name,
|
|
1346
1322
|
"input_cols": getattr(block, "input_cols", None),
|
|
1347
1323
|
"output_cols": getattr(block, "output_cols", None),
|
|
@@ -31,12 +31,12 @@ def aggregate_block_metrics(entries: list[dict[str, Any]]) -> list[dict[str, Any
|
|
|
31
31
|
"""
|
|
32
32
|
agg: dict[tuple[str, str], dict[str, Any]] = {}
|
|
33
33
|
for m in entries:
|
|
34
|
-
key = (m.get("block_name"), m.get("
|
|
34
|
+
key = (m.get("block_name"), m.get("block_class"))
|
|
35
35
|
a = agg.setdefault(
|
|
36
36
|
key,
|
|
37
37
|
{
|
|
38
38
|
"block_name": key[0],
|
|
39
|
-
"
|
|
39
|
+
"block_class": key[1],
|
|
40
40
|
"execution_time": 0.0,
|
|
41
41
|
"input_rows": 0,
|
|
42
42
|
"output_rows": 0,
|
|
@@ -138,7 +138,7 @@ def display_metrics_summary(
|
|
|
138
138
|
|
|
139
139
|
table.add_row(
|
|
140
140
|
metrics["block_name"],
|
|
141
|
-
metrics["
|
|
141
|
+
metrics["block_class"],
|
|
142
142
|
duration,
|
|
143
143
|
row_change,
|
|
144
144
|
col_change,
|
|
@@ -41,7 +41,7 @@ blocks:
|
|
|
41
41
|
max_tokens: 2048
|
|
42
42
|
temperature: 0.7
|
|
43
43
|
|
|
44
|
-
- block_type:
|
|
44
|
+
- block_type: LLMResponseExtractorBlock
|
|
45
45
|
block_config:
|
|
46
46
|
block_name: parse_topic
|
|
47
47
|
input_cols: topic_response
|
|
@@ -73,7 +73,7 @@ blocks:
|
|
|
73
73
|
max_tokens: 2048
|
|
74
74
|
temperature: 0.7
|
|
75
75
|
|
|
76
|
-
- block_type:
|
|
76
|
+
- block_type: LLMResponseExtractorBlock
|
|
77
77
|
block_config:
|
|
78
78
|
block_name: parse_question
|
|
79
79
|
input_cols: question_response
|
|
@@ -97,7 +97,7 @@ blocks:
|
|
|
97
97
|
max_tokens: 4096
|
|
98
98
|
temperature: 0.7
|
|
99
99
|
|
|
100
|
-
- block_type:
|
|
100
|
+
- block_type: LLMResponseExtractorBlock
|
|
101
101
|
block_config:
|
|
102
102
|
block_name: parse_evolved_question
|
|
103
103
|
input_cols: evolution_response
|
|
@@ -123,7 +123,7 @@ blocks:
|
|
|
123
123
|
max_tokens: 4096
|
|
124
124
|
temperature: 0.2
|
|
125
125
|
|
|
126
|
-
- block_type:
|
|
126
|
+
- block_type: LLMResponseExtractorBlock
|
|
127
127
|
block_config:
|
|
128
128
|
block_name: parse_answer
|
|
129
129
|
input_cols: answer_response
|
|
@@ -150,7 +150,7 @@ blocks:
|
|
|
150
150
|
max_tokens: 512
|
|
151
151
|
temperature: 0.0
|
|
152
152
|
|
|
153
|
-
- block_type:
|
|
153
|
+
- block_type: LLMResponseExtractorBlock
|
|
154
154
|
block_config:
|
|
155
155
|
block_name: parse_critic_score
|
|
156
156
|
input_cols: critic_response
|
|
@@ -185,7 +185,7 @@ blocks:
|
|
|
185
185
|
max_tokens: 4096
|
|
186
186
|
temperature: 0.0
|
|
187
187
|
|
|
188
|
-
- block_type:
|
|
188
|
+
- block_type: LLMResponseExtractorBlock
|
|
189
189
|
block_config:
|
|
190
190
|
block_name: parse_extracted_context
|
|
191
191
|
input_cols: extraction_response
|
|
@@ -60,7 +60,7 @@ blocks:
|
|
|
60
60
|
temperature: 0.7
|
|
61
61
|
n: 50
|
|
62
62
|
async_mode: true
|
|
63
|
-
- block_type:
|
|
63
|
+
- block_type: LLMResponseExtractorBlock
|
|
64
64
|
block_config:
|
|
65
65
|
block_name: extract_detailed_summary
|
|
66
66
|
input_cols: raw_summary
|
|
@@ -108,7 +108,7 @@ blocks:
|
|
|
108
108
|
temperature: 0.7
|
|
109
109
|
n: 1
|
|
110
110
|
async_mode: true
|
|
111
|
-
- block_type:
|
|
111
|
+
- block_type: LLMResponseExtractorBlock
|
|
112
112
|
block_config:
|
|
113
113
|
block_name: extract_questions
|
|
114
114
|
input_cols: question_list
|
|
@@ -142,7 +142,7 @@ blocks:
|
|
|
142
142
|
temperature: 0.7
|
|
143
143
|
n: 1
|
|
144
144
|
async_mode: true
|
|
145
|
-
- block_type:
|
|
145
|
+
- block_type: LLMResponseExtractorBlock
|
|
146
146
|
block_config:
|
|
147
147
|
block_name: extract_answers
|
|
148
148
|
input_cols: response_dict
|
|
@@ -174,7 +174,7 @@ blocks:
|
|
|
174
174
|
output_cols: eval_faithful_response_dict
|
|
175
175
|
n: 1
|
|
176
176
|
async_mode: true
|
|
177
|
-
- block_type:
|
|
177
|
+
- block_type: LLMResponseExtractorBlock
|
|
178
178
|
block_config:
|
|
179
179
|
block_name: extract_eval_faithful
|
|
180
180
|
input_cols: eval_faithful_response_dict
|
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/doc_direct_qa/flow.yaml
CHANGED
|
@@ -64,7 +64,7 @@ blocks:
|
|
|
64
64
|
temperature: 1.0
|
|
65
65
|
n: 1
|
|
66
66
|
async_mode: true
|
|
67
|
-
- block_type:
|
|
67
|
+
- block_type: LLMResponseExtractorBlock
|
|
68
68
|
block_config:
|
|
69
69
|
block_name: extract_questions
|
|
70
70
|
input_cols: question_list
|
|
@@ -98,7 +98,7 @@ blocks:
|
|
|
98
98
|
temperature: 1.0
|
|
99
99
|
n: 1
|
|
100
100
|
async_mode: true
|
|
101
|
-
- block_type:
|
|
101
|
+
- block_type: LLMResponseExtractorBlock
|
|
102
102
|
block_config:
|
|
103
103
|
block_name: extract_answer
|
|
104
104
|
input_cols: response_dict
|
|
@@ -130,7 +130,7 @@ blocks:
|
|
|
130
130
|
output_cols: eval_faithful_response_dict
|
|
131
131
|
n: 1
|
|
132
132
|
async_mode: true
|
|
133
|
-
- block_type:
|
|
133
|
+
- block_type: LLMResponseExtractorBlock
|
|
134
134
|
block_config:
|
|
135
135
|
block_name: extract_eval_faithful
|
|
136
136
|
input_cols: eval_faithful_response_dict
|
|
@@ -62,7 +62,7 @@ blocks:
|
|
|
62
62
|
temperature: 0.7
|
|
63
63
|
n: 50
|
|
64
64
|
async_mode: true
|
|
65
|
-
- block_type:
|
|
65
|
+
- block_type: LLMResponseExtractorBlock
|
|
66
66
|
block_config:
|
|
67
67
|
block_name: extract_extractive_summary
|
|
68
68
|
input_cols: raw_summary
|
|
@@ -110,7 +110,7 @@ blocks:
|
|
|
110
110
|
temperature: 0.7
|
|
111
111
|
n: 1
|
|
112
112
|
async_mode: true
|
|
113
|
-
- block_type:
|
|
113
|
+
- block_type: LLMResponseExtractorBlock
|
|
114
114
|
block_config:
|
|
115
115
|
block_name: extract_questions
|
|
116
116
|
input_cols: question_list
|
|
@@ -144,7 +144,7 @@ blocks:
|
|
|
144
144
|
temperature: 0.7
|
|
145
145
|
n: 1
|
|
146
146
|
async_mode: true
|
|
147
|
-
- block_type:
|
|
147
|
+
- block_type: LLMResponseExtractorBlock
|
|
148
148
|
block_config:
|
|
149
149
|
block_name: extract_answers
|
|
150
150
|
input_cols: response_dict
|
|
@@ -176,7 +176,7 @@ blocks:
|
|
|
176
176
|
output_cols: eval_faithful_response_dict
|
|
177
177
|
n: 1
|
|
178
178
|
async_mode: true
|
|
179
|
-
- block_type:
|
|
179
|
+
- block_type: LLMResponseExtractorBlock
|
|
180
180
|
block_config:
|
|
181
181
|
block_name: extract_eval_faithful
|
|
182
182
|
input_cols: eval_faithful_response_dict
|
sdg_hub/flows/qa_generation/document_grounded_qa/enhanced_multi_summary_qa/key_facts/flow.yaml
CHANGED
|
@@ -49,7 +49,7 @@ blocks:
|
|
|
49
49
|
temperature: 0.7
|
|
50
50
|
n: 1
|
|
51
51
|
async_mode: true
|
|
52
|
-
- block_type:
|
|
52
|
+
- block_type: LLMResponseExtractorBlock
|
|
53
53
|
block_config:
|
|
54
54
|
block_name: extract_atomic_facts
|
|
55
55
|
input_cols: raw_summary
|
|
@@ -98,7 +98,7 @@ blocks:
|
|
|
98
98
|
temperature: 0.7
|
|
99
99
|
n: 1
|
|
100
100
|
async_mode: true
|
|
101
|
-
- block_type:
|
|
101
|
+
- block_type: LLMResponseExtractorBlock
|
|
102
102
|
block_config:
|
|
103
103
|
block_name: extract_key_fact_qa
|
|
104
104
|
input_cols: raw_key_fact_qa
|
|
@@ -55,7 +55,7 @@ blocks:
|
|
|
55
55
|
async_mode: true
|
|
56
56
|
n: 2
|
|
57
57
|
|
|
58
|
-
- block_type:
|
|
58
|
+
- block_type: LLMResponseExtractorBlock
|
|
59
59
|
block_config:
|
|
60
60
|
block_name: detailed_summary
|
|
61
61
|
input_cols: raw_summary_detailed
|
|
@@ -85,7 +85,7 @@ blocks:
|
|
|
85
85
|
max_tokens: 2048
|
|
86
86
|
async_mode: true
|
|
87
87
|
|
|
88
|
-
- block_type:
|
|
88
|
+
- block_type: LLMResponseExtractorBlock
|
|
89
89
|
block_config:
|
|
90
90
|
block_name: atomic_facts
|
|
91
91
|
input_cols: raw_atomic_facts
|
|
@@ -114,7 +114,7 @@ blocks:
|
|
|
114
114
|
max_tokens: 2048
|
|
115
115
|
async_mode: true
|
|
116
116
|
|
|
117
|
-
- block_type:
|
|
117
|
+
- block_type: LLMResponseExtractorBlock
|
|
118
118
|
block_config:
|
|
119
119
|
block_name: extractive_summary
|
|
120
120
|
input_cols: raw_summary_extractive
|
|
@@ -160,7 +160,7 @@ blocks:
|
|
|
160
160
|
max_tokens: 2048
|
|
161
161
|
async_mode: true
|
|
162
162
|
|
|
163
|
-
- block_type:
|
|
163
|
+
- block_type: LLMResponseExtractorBlock
|
|
164
164
|
block_config:
|
|
165
165
|
block_name: get_knowledge_generation
|
|
166
166
|
input_cols: raw_knowledge_generation
|
|
@@ -191,7 +191,7 @@ blocks:
|
|
|
191
191
|
n: 1
|
|
192
192
|
async_mode: true
|
|
193
193
|
|
|
194
|
-
- block_type:
|
|
194
|
+
- block_type: LLMResponseExtractorBlock
|
|
195
195
|
block_config:
|
|
196
196
|
block_name: extract_eval_faithful
|
|
197
197
|
input_cols: eval_faithful_response_dict
|
|
@@ -236,7 +236,7 @@ blocks:
|
|
|
236
236
|
max_tokens: 2048
|
|
237
237
|
n: 1
|
|
238
238
|
async_mode: true
|
|
239
|
-
- block_type:
|
|
239
|
+
- block_type: LLMResponseExtractorBlock
|
|
240
240
|
block_config:
|
|
241
241
|
block_name: extract_eval_relevancy
|
|
242
242
|
input_cols: eval_relevancy_response_dict
|
|
@@ -280,7 +280,7 @@ blocks:
|
|
|
280
280
|
max_tokens: 2048
|
|
281
281
|
n: 1
|
|
282
282
|
async_mode: true
|
|
283
|
-
- block_type:
|
|
283
|
+
- block_type: LLMResponseExtractorBlock
|
|
284
284
|
block_config:
|
|
285
285
|
block_name: extract_verify_question
|
|
286
286
|
input_cols: verify_question_response_dict
|
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/multilingual/japanese/flow.yaml
CHANGED
|
@@ -57,7 +57,7 @@ blocks:
|
|
|
57
57
|
async_mode: true
|
|
58
58
|
# n: 2
|
|
59
59
|
|
|
60
|
-
- block_type:
|
|
60
|
+
- block_type: LLMResponseExtractorBlock
|
|
61
61
|
block_config:
|
|
62
62
|
block_name: detailed_summary
|
|
63
63
|
input_cols: raw_summary_detailed
|
|
@@ -87,7 +87,7 @@ blocks:
|
|
|
87
87
|
max_tokens: 2048
|
|
88
88
|
async_mode: true
|
|
89
89
|
|
|
90
|
-
- block_type:
|
|
90
|
+
- block_type: LLMResponseExtractorBlock
|
|
91
91
|
block_config:
|
|
92
92
|
block_name: atomic_facts
|
|
93
93
|
input_cols: raw_atomic_facts
|
|
@@ -116,7 +116,7 @@ blocks:
|
|
|
116
116
|
max_tokens: 2048
|
|
117
117
|
async_mode: true
|
|
118
118
|
|
|
119
|
-
- block_type:
|
|
119
|
+
- block_type: LLMResponseExtractorBlock
|
|
120
120
|
block_config:
|
|
121
121
|
block_name: extractive_summary
|
|
122
122
|
input_cols: raw_summary_extractive
|
|
@@ -161,7 +161,7 @@ blocks:
|
|
|
161
161
|
max_tokens: 2048
|
|
162
162
|
async_mode: true
|
|
163
163
|
|
|
164
|
-
- block_type:
|
|
164
|
+
- block_type: LLMResponseExtractorBlock
|
|
165
165
|
block_config:
|
|
166
166
|
block_name: get_knowledge_generation
|
|
167
167
|
input_cols: raw_knowledge_generation
|
|
@@ -192,7 +192,7 @@ blocks:
|
|
|
192
192
|
n: 1
|
|
193
193
|
async_mode: true
|
|
194
194
|
|
|
195
|
-
- block_type:
|
|
195
|
+
- block_type: LLMResponseExtractorBlock
|
|
196
196
|
block_config:
|
|
197
197
|
block_name: extract_eval_faithful
|
|
198
198
|
input_cols: eval_faithful_response_dict
|
|
@@ -237,7 +237,7 @@ blocks:
|
|
|
237
237
|
max_tokens: 2048
|
|
238
238
|
n: 1
|
|
239
239
|
async_mode: true
|
|
240
|
-
- block_type:
|
|
240
|
+
- block_type: LLMResponseExtractorBlock
|
|
241
241
|
block_config:
|
|
242
242
|
block_name: extract_eval_relevancy
|
|
243
243
|
input_cols: eval_relevancy_response_dict
|
|
@@ -281,7 +281,7 @@ blocks:
|
|
|
281
281
|
max_tokens: 2048
|
|
282
282
|
n: 1
|
|
283
283
|
async_mode: true
|
|
284
|
-
- block_type:
|
|
284
|
+
- block_type: LLMResponseExtractorBlock
|
|
285
285
|
block_config:
|
|
286
286
|
block_name: extract_verify_question
|
|
287
287
|
input_cols: verify_question_response_dict
|
|
@@ -49,7 +49,7 @@ blocks:
|
|
|
49
49
|
max_tokens: 1024
|
|
50
50
|
temperature: 0.3
|
|
51
51
|
async_mode: true
|
|
52
|
-
- block_type: "
|
|
52
|
+
- block_type: "LLMResponseExtractorBlock"
|
|
53
53
|
block_config:
|
|
54
54
|
block_name: "extract_summary"
|
|
55
55
|
input_cols: "raw_summary"
|
|
@@ -81,7 +81,7 @@ blocks:
|
|
|
81
81
|
max_tokens: 512
|
|
82
82
|
temperature: 0.3
|
|
83
83
|
async_mode: true
|
|
84
|
-
- block_type: "
|
|
84
|
+
- block_type: "LLMResponseExtractorBlock"
|
|
85
85
|
block_config:
|
|
86
86
|
block_name: "extract_keywords"
|
|
87
87
|
input_cols: "raw_keywords"
|
|
@@ -113,7 +113,7 @@ blocks:
|
|
|
113
113
|
max_tokens: 1024
|
|
114
114
|
temperature: 0.3
|
|
115
115
|
async_mode: true
|
|
116
|
-
- block_type: "
|
|
116
|
+
- block_type: "LLMResponseExtractorBlock"
|
|
117
117
|
block_config:
|
|
118
118
|
block_name: "extract_entities"
|
|
119
119
|
input_cols: "raw_entities"
|
|
@@ -145,7 +145,7 @@ blocks:
|
|
|
145
145
|
max_tokens: 256
|
|
146
146
|
temperature: 0.1
|
|
147
147
|
async_mode: true
|
|
148
|
-
- block_type: "
|
|
148
|
+
- block_type: "LLMResponseExtractorBlock"
|
|
149
149
|
block_config:
|
|
150
150
|
block_name: "extract_sentiment"
|
|
151
151
|
input_cols: "raw_sentiment"
|