PyPI - sdg-hub - Versions diffs - 0.2.1__py3-none-any.whl → 0.2.2__py3-none-any.whl - Mend

sdg-hub 0.2.1__py3-none-any.whl → 0.2.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20) hide show

sdg_hub/_version.py +16 -3
sdg_hub/core/blocks/deprecated_blocks/selector.py +1 -1
sdg_hub/core/blocks/evaluation/evaluate_faithfulness_block.py +175 -416
sdg_hub/core/blocks/evaluation/evaluate_relevancy_block.py +174 -415
sdg_hub/core/blocks/evaluation/verify_question_block.py +180 -415
sdg_hub/core/blocks/llm/client_manager.py +61 -24
sdg_hub/core/blocks/llm/config.py +1 -0
sdg_hub/core/blocks/llm/llm_chat_block.py +62 -7
sdg_hub/core/blocks/llm/llm_chat_with_parsing_retry_block.py +277 -115
sdg_hub/core/blocks/llm/text_parser_block.py +0 -2
sdg_hub/core/blocks/registry.py +48 -34
sdg_hub/core/blocks/transform/index_based_mapper.py +1 -1
sdg_hub/core/flow/base.py +131 -10
sdg_hub/core/utils/datautils.py +29 -0
sdg_hub/flows/qa_generation/document_grounded_qa/multi_summary_qa/instructlab/flow.yaml +0 -7
{sdg_hub-0.2.1.dist-info → sdg_hub-0.2.2.dist-info}/METADATA +40 -15
{sdg_hub-0.2.1.dist-info → sdg_hub-0.2.2.dist-info}/RECORD +20 -20
{sdg_hub-0.2.1.dist-info → sdg_hub-0.2.2.dist-info}/WHEEL +0 -0
{sdg_hub-0.2.1.dist-info → sdg_hub-0.2.2.dist-info}/licenses/LICENSE +0 -0
{sdg_hub-0.2.1.dist-info → sdg_hub-0.2.2.dist-info}/top_level.txt +0 -0

sdg_hub/core/blocks/llm/client_manager.py CHANGED Viewed

@@ -160,9 +160,69 @@ class LLMClientManager:
             return response.choices[0].message.content
     async def acreate_completion(
+        self,
+        messages: Union[list[dict[str, Any]], list[list[dict[str, Any]]]],
+        max_concurrency: Optional[int] = None,
+        **overrides: Any,
+    ) -> Union[str, list[str], list[Union[str, list[str]]]]:
+        """Create async completion(s) using LiteLLM with optional concurrency control.
+        Parameters
+        ----------
+        messages : Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]]
+            Single message list or list of message lists.
+            - For single: List[Dict[str, Any]] - returns Union[str, List[str]]
+            - For multiple: List[List[Dict[str, Any]]] - returns List[Union[str, List[str]]]
+        max_concurrency : Optional[int], optional
+            Maximum number of concurrent requests when processing multiple messages.
+            If None, all requests run concurrently.
+        **overrides : Any
+            Runtime parameter overrides.
+        Returns
+        -------
+        Union[str, List[str], List[Union[str, List[str]]]]
+            For single message: completion text (string when n=1, list when n>1)
+            For multiple messages: list of completion texts (each element can be str or List[str])
+        Raises
+        ------
+        Exception
+            If the completion fails after all retries.
+        """
+        # Detect if we have single message or multiple messages
+        if not messages:
+            raise ValueError("messages cannot be empty")
+        # Check if first element is a dict (single message) or list (multiple messages)
+        if isinstance(messages[0], dict):
+            # Single message case
+            return await self._acreate_single(messages, **overrides)
+        else:
+            # Multiple messages case
+            messages_list = messages
+            if max_concurrency is not None:
+                # Use semaphore for concurrency control
+                semaphore = asyncio.Semaphore(max_concurrency)
+                async def _create_with_semaphore(msgs):
+                    async with semaphore:
+                        return await self._acreate_single(msgs, **overrides)
+                tasks = [_create_with_semaphore(msgs) for msgs in messages_list]
+                return await asyncio.gather(*tasks)
+            else:
+                # No concurrency limit - process all at once
+                tasks = [
+                    self._acreate_single(msgs, **overrides) for msgs in messages_list
+                ]
+                return await asyncio.gather(*tasks)
+    async def _acreate_single(
         self, messages: list[dict[str, Any]], **overrides: Any
     ) -> Union[str, list[str]]:
-        """Create an async completion using LiteLLM.
+        """Create a single async completion using LiteLLM.
         Parameters
         ----------
@@ -235,29 +295,6 @@ class LLMClientManager:
             results.append(result)
         return results
-    async def acreate_completions_batch(
-        self, messages_list: list[list[dict[str, Any]]], **overrides: Any
-    ) -> list[Union[str, list[str]]]:
-        """Create multiple completions in batch asynchronously.
-        Parameters
-        ----------
-        messages_list : List[List[Dict[str, Any]]]
-            List of message lists to process.
-        **overrides : Any
-            Runtime parameter overrides.
-        Returns
-        -------
-        List[Union[str, List[str]]]
-            List of completion texts. Each element is a single string when n=1 or n is None,
-            or a list of strings when n>1.
-        """
-        tasks = [
-            self.acreate_completion(messages, **overrides) for messages in messages_list
-        ]
-        return await asyncio.gather(*tasks)
     def _build_completion_kwargs(
         self, messages: list[dict[str, Any]], config: LLMConfig
     ) -> dict[str, Any]:

sdg_hub/core/blocks/llm/config.py CHANGED Viewed

@@ -240,6 +240,7 @@ class LLMConfig:
             "logprobs",
             "top_logprobs",
             "user",
+            "timeout",
         ]:
             value = getattr(self, param)
             if value is not None:

sdg_hub/core/blocks/llm/llm_chat_block.py CHANGED Viewed

@@ -297,6 +297,10 @@ class LLMChatBlock(BaseBlock):
             temperature, max_tokens, top_p, frequency_penalty, presence_penalty,
             stop, seed, response_format, stream, n, and provider-specific params.
+            Special flow-level parameters:
+            _flow_max_concurrency : int, optional
+                Maximum concurrency for async requests (passed by Flow).
         Returns
         -------
         Dataset
@@ -314,27 +318,73 @@ class LLMChatBlock(BaseBlock):
                 f"Call flow.set_model_config() before generating."
             )
+        # Extract max_concurrency if provided by flow
+        flow_max_concurrency = override_kwargs.pop("_flow_max_concurrency", None)
         # Extract messages
         messages_list = samples[self.input_cols[0]]
         # Log generation start
         logger.info(
-            f"Starting {'async' if self.async_mode else 'sync'} generation for {len(messages_list)} samples",
+            f"Starting {'async' if self.async_mode else 'sync'} generation for {len(messages_list)} samples"
+            + (
+                f" (max_concurrency={flow_max_concurrency})"
+                if flow_max_concurrency
+                else ""
+            ),
             extra={
                 "block_name": self.block_name,
                 "model": self.model,
                 "provider": self.client_manager.config.get_provider(),
                 "batch_size": len(messages_list),
                 "async_mode": self.async_mode,
-                "override_params": override_kwargs,
+                "flow_max_concurrency": flow_max_concurrency,
+                "override_params": {
+                    k: (
+                        "***"
+                        if any(
+                            s in k.lower()
+                            for s in ["key", "token", "secret", "authorization"]
+                        )
+                        else v
+                    )
+                    for k, v in override_kwargs.items()
+                },
             },
         )
         # Generate responses
         if self.async_mode:
-            responses = asyncio.run(
-                self._generate_async(messages_list, **override_kwargs)
-            )
+            try:
+                # Check if there's already a running event loop
+                loop = asyncio.get_running_loop()
+                # Check if nest_asyncio is applied (allows nested asyncio.run)
+                # Use multiple detection methods for robustness
+                nest_asyncio_applied = (
+                    hasattr(loop, "_nest_patched")
+                    or getattr(asyncio.run, "__module__", "") == "nest_asyncio"
+                )
+                if nest_asyncio_applied:
+                    # nest_asyncio is applied, safe to use asyncio.run
+                    responses = asyncio.run(
+                        self._generate_async(
+                            messages_list, flow_max_concurrency, **override_kwargs
+                        )
+                    )
+                else:
+                    # Running inside an event loop without nest_asyncio
+                    raise BlockValidationError(
+                        f"async_mode=True cannot be used from within a running event loop for '{self.block_name}'. "
+                        "Use an async entrypoint, set async_mode=False, or apply nest_asyncio.apply() in notebook environments."
+                    )
+            except RuntimeError:
+                # No running loop; safe to create one
+                responses = asyncio.run(
+                    self._generate_async(
+                        messages_list, flow_max_concurrency, **override_kwargs
+                    )
+                )
         else:
             responses = self._generate_sync(messages_list, **override_kwargs)
@@ -409,6 +459,7 @@ class LLMChatBlock(BaseBlock):
     async def _generate_async(
         self,
         messages_list: list[list[dict[str, Any]]],
+        flow_max_concurrency: Optional[int] = None,
         **override_kwargs: dict[str, Any],
     ) -> list[Union[str, list[str]]]:
         """Generate responses asynchronously.
@@ -417,6 +468,8 @@ class LLMChatBlock(BaseBlock):
         ----------
         messages_list : List[List[Dict[str, Any]]]
             List of message lists to process.
+        flow_max_concurrency : Optional[int], optional
+            Maximum concurrency for async requests.
         **override_kwargs : Dict[str, Any]
             Runtime parameter overrides.
@@ -426,9 +479,11 @@ class LLMChatBlock(BaseBlock):
             List of response strings or lists of response strings (when n > 1).
         """
         try:
-            responses = await self.client_manager.acreate_completions_batch(
-                messages_list, **override_kwargs
+            # Use unified client manager method with optional concurrency control
+            responses = await self.client_manager.acreate_completion(
+                messages_list, max_concurrency=flow_max_concurrency, **override_kwargs
             )
             return responses
         except Exception as e:

sdg-hub 0.2.1__py3-none-any.whl → 0.2.2__py3-none-any.whl

sdg-hub 0.2.1__py3-none-any.whl → 0.2.2__py3-none-any.whl