PyPI - aiqtoolkit - Versions diffs - 1.2.0.dev0__py3-none-any.whl → 1.2.0rc2__py3-none-any.whl - Mend

aiqtoolkit 1.2.0.dev0-py3-none-any.whl → 1.2.0rc2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of aiqtoolkit might be problematic. Click here for more details.

Files changed (220) hide show

aiq/agent/base.py +170 -8
aiq/agent/dual_node.py +1 -1
aiq/agent/react_agent/agent.py +146 -112
aiq/agent/react_agent/prompt.py +1 -6
aiq/agent/react_agent/register.py +36 -35
aiq/agent/rewoo_agent/agent.py +36 -35
aiq/agent/rewoo_agent/register.py +2 -2
aiq/agent/tool_calling_agent/agent.py +3 -7
aiq/agent/tool_calling_agent/register.py +1 -1
aiq/authentication/__init__.py +14 -0
aiq/authentication/api_key/__init__.py +14 -0
aiq/authentication/api_key/api_key_auth_provider.py +92 -0
aiq/authentication/api_key/api_key_auth_provider_config.py +124 -0
aiq/authentication/api_key/register.py +26 -0
aiq/authentication/exceptions/__init__.py +14 -0
aiq/authentication/exceptions/api_key_exceptions.py +38 -0
aiq/authentication/exceptions/auth_code_grant_exceptions.py +86 -0
aiq/authentication/exceptions/call_back_exceptions.py +38 -0
aiq/authentication/exceptions/request_exceptions.py +54 -0
aiq/authentication/http_basic_auth/__init__.py +0 -0
aiq/authentication/http_basic_auth/http_basic_auth_provider.py +81 -0
aiq/authentication/http_basic_auth/register.py +30 -0
aiq/authentication/interfaces.py +93 -0
aiq/authentication/oauth2/__init__.py +14 -0
aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +107 -0
aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +39 -0
aiq/authentication/oauth2/register.py +25 -0
aiq/authentication/register.py +21 -0
aiq/builder/builder.py +64 -2
aiq/builder/component_utils.py +16 -3
aiq/builder/context.py +37 -0
aiq/builder/eval_builder.py +43 -2
aiq/builder/function.py +44 -12
aiq/builder/function_base.py +1 -1
aiq/builder/intermediate_step_manager.py +6 -8
aiq/builder/user_interaction_manager.py +3 -0
aiq/builder/workflow.py +23 -18
aiq/builder/workflow_builder.py +421 -61
aiq/cli/commands/info/list_mcp.py +103 -16
aiq/cli/commands/sizing/__init__.py +14 -0
aiq/cli/commands/sizing/calc.py +294 -0
aiq/cli/commands/sizing/sizing.py +27 -0
aiq/cli/commands/start.py +2 -1
aiq/cli/entrypoint.py +2 -0
aiq/cli/register_workflow.py +80 -0
aiq/cli/type_registry.py +151 -30
aiq/data_models/api_server.py +124 -12
aiq/data_models/authentication.py +231 -0
aiq/data_models/common.py +35 -7
aiq/data_models/component.py +17 -9
aiq/data_models/component_ref.py +33 -0
aiq/data_models/config.py +60 -3
aiq/data_models/dataset_handler.py +2 -1
aiq/data_models/embedder.py +1 -0
aiq/data_models/evaluate.py +23 -0
aiq/data_models/function_dependencies.py +8 -0
aiq/data_models/interactive.py +10 -1
aiq/data_models/intermediate_step.py +38 -5
aiq/data_models/its_strategy.py +30 -0
aiq/data_models/llm.py +1 -0
aiq/data_models/memory.py +1 -0
aiq/data_models/object_store.py +44 -0
aiq/data_models/profiler.py +1 -0
aiq/data_models/retry_mixin.py +35 -0
aiq/data_models/span.py +187 -0
aiq/data_models/telemetry_exporter.py +2 -2
aiq/embedder/nim_embedder.py +2 -1
aiq/embedder/openai_embedder.py +2 -1
aiq/eval/config.py +19 -1
aiq/eval/dataset_handler/dataset_handler.py +87 -2
aiq/eval/evaluate.py +208 -27
aiq/eval/evaluator/base_evaluator.py +73 -0
aiq/eval/evaluator/evaluator_model.py +1 -0
aiq/eval/intermediate_step_adapter.py +11 -5
aiq/eval/rag_evaluator/evaluate.py +55 -15
aiq/eval/rag_evaluator/register.py +6 -1
aiq/eval/remote_workflow.py +7 -2
aiq/eval/runners/__init__.py +14 -0
aiq/eval/runners/config.py +39 -0
aiq/eval/runners/multi_eval_runner.py +54 -0
aiq/eval/trajectory_evaluator/evaluate.py +22 -65
aiq/eval/tunable_rag_evaluator/evaluate.py +150 -168
aiq/eval/tunable_rag_evaluator/register.py +2 -0
aiq/eval/usage_stats.py +41 -0
aiq/eval/utils/output_uploader.py +10 -1
aiq/eval/utils/weave_eval.py +184 -0
aiq/experimental/__init__.py +0 -0
aiq/experimental/decorators/__init__.py +0 -0
aiq/experimental/decorators/experimental_warning_decorator.py +130 -0
aiq/experimental/inference_time_scaling/__init__.py +0 -0
aiq/experimental/inference_time_scaling/editing/__init__.py +0 -0
aiq/experimental/inference_time_scaling/editing/iterative_plan_refinement_editor.py +147 -0
aiq/experimental/inference_time_scaling/editing/llm_as_a_judge_editor.py +204 -0
aiq/experimental/inference_time_scaling/editing/motivation_aware_summarization.py +107 -0
aiq/experimental/inference_time_scaling/functions/__init__.py +0 -0
aiq/experimental/inference_time_scaling/functions/execute_score_select_function.py +105 -0
aiq/experimental/inference_time_scaling/functions/its_tool_orchestration_function.py +205 -0
aiq/experimental/inference_time_scaling/functions/its_tool_wrapper_function.py +146 -0
aiq/experimental/inference_time_scaling/functions/plan_select_execute_function.py +224 -0
aiq/experimental/inference_time_scaling/models/__init__.py +0 -0
aiq/experimental/inference_time_scaling/models/editor_config.py +132 -0
aiq/experimental/inference_time_scaling/models/its_item.py +48 -0
aiq/experimental/inference_time_scaling/models/scoring_config.py +112 -0
aiq/experimental/inference_time_scaling/models/search_config.py +120 -0
aiq/experimental/inference_time_scaling/models/selection_config.py +154 -0
aiq/experimental/inference_time_scaling/models/stage_enums.py +43 -0
aiq/experimental/inference_time_scaling/models/strategy_base.py +66 -0
aiq/experimental/inference_time_scaling/models/tool_use_config.py +41 -0
aiq/experimental/inference_time_scaling/register.py +36 -0
aiq/experimental/inference_time_scaling/scoring/__init__.py +0 -0
aiq/experimental/inference_time_scaling/scoring/llm_based_agent_scorer.py +168 -0
aiq/experimental/inference_time_scaling/scoring/llm_based_plan_scorer.py +168 -0
aiq/experimental/inference_time_scaling/scoring/motivation_aware_scorer.py +111 -0
aiq/experimental/inference_time_scaling/search/__init__.py +0 -0
aiq/experimental/inference_time_scaling/search/multi_llm_planner.py +128 -0
aiq/experimental/inference_time_scaling/search/multi_query_retrieval_search.py +122 -0
aiq/experimental/inference_time_scaling/search/single_shot_multi_plan_planner.py +128 -0
aiq/experimental/inference_time_scaling/selection/__init__.py +0 -0
aiq/experimental/inference_time_scaling/selection/best_of_n_selector.py +63 -0
aiq/experimental/inference_time_scaling/selection/llm_based_agent_output_selector.py +131 -0
aiq/experimental/inference_time_scaling/selection/llm_based_output_merging_selector.py +159 -0
aiq/experimental/inference_time_scaling/selection/llm_based_plan_selector.py +128 -0
aiq/experimental/inference_time_scaling/selection/threshold_selector.py +58 -0
aiq/front_ends/console/authentication_flow_handler.py +233 -0
aiq/front_ends/console/console_front_end_plugin.py +11 -2
aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +27 -0
aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +107 -0
aiq/front_ends/fastapi/fastapi_front_end_config.py +93 -9
aiq/front_ends/fastapi/fastapi_front_end_controller.py +68 -0
aiq/front_ends/fastapi/fastapi_front_end_plugin.py +14 -1
aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +537 -52
aiq/front_ends/fastapi/html_snippets/__init__.py +14 -0
aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +35 -0
aiq/front_ends/fastapi/job_store.py +47 -25
aiq/front_ends/fastapi/main.py +2 -0
aiq/front_ends/fastapi/message_handler.py +108 -89
aiq/front_ends/fastapi/step_adaptor.py +2 -1
aiq/llm/aws_bedrock_llm.py +57 -0
aiq/llm/nim_llm.py +2 -1
aiq/llm/openai_llm.py +3 -2
aiq/llm/register.py +1 -0
aiq/meta/pypi.md +12 -12
aiq/object_store/__init__.py +20 -0
aiq/object_store/in_memory_object_store.py +74 -0
aiq/object_store/interfaces.py +84 -0
aiq/object_store/models.py +36 -0
aiq/object_store/register.py +20 -0
aiq/observability/__init__.py +14 -0
aiq/observability/exporter/__init__.py +14 -0
aiq/observability/exporter/base_exporter.py +449 -0
aiq/observability/exporter/exporter.py +78 -0
aiq/observability/exporter/file_exporter.py +33 -0
aiq/observability/exporter/processing_exporter.py +269 -0
aiq/observability/exporter/raw_exporter.py +52 -0
aiq/observability/exporter/span_exporter.py +264 -0
aiq/observability/exporter_manager.py +335 -0
aiq/observability/mixin/__init__.py +14 -0
aiq/observability/mixin/batch_config_mixin.py +26 -0
aiq/observability/mixin/collector_config_mixin.py +23 -0
aiq/observability/mixin/file_mixin.py +288 -0
aiq/observability/mixin/file_mode.py +23 -0
aiq/observability/mixin/resource_conflict_mixin.py +134 -0
aiq/observability/mixin/serialize_mixin.py +61 -0
aiq/observability/mixin/type_introspection_mixin.py +183 -0
aiq/observability/processor/__init__.py +14 -0
aiq/observability/processor/batching_processor.py +316 -0
aiq/observability/processor/intermediate_step_serializer.py +28 -0
aiq/observability/processor/processor.py +68 -0
aiq/observability/register.py +36 -39
aiq/observability/utils/__init__.py +14 -0
aiq/observability/utils/dict_utils.py +236 -0
aiq/observability/utils/time_utils.py +31 -0
aiq/profiler/calc/__init__.py +14 -0
aiq/profiler/calc/calc_runner.py +623 -0
aiq/profiler/calc/calculations.py +288 -0
aiq/profiler/calc/data_models.py +176 -0
aiq/profiler/calc/plot.py +345 -0
aiq/profiler/callbacks/langchain_callback_handler.py +22 -10
aiq/profiler/data_models.py +24 -0
aiq/profiler/inference_metrics_model.py +3 -0
aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +8 -0
aiq/profiler/inference_optimization/data_models.py +2 -2
aiq/profiler/inference_optimization/llm_metrics.py +2 -2
aiq/profiler/profile_runner.py +61 -21
aiq/runtime/loader.py +9 -3
aiq/runtime/runner.py +23 -9
aiq/runtime/session.py +25 -7
aiq/runtime/user_metadata.py +2 -3
aiq/tool/chat_completion.py +74 -0
aiq/tool/code_execution/README.md +152 -0
aiq/tool/code_execution/code_sandbox.py +151 -72
aiq/tool/code_execution/local_sandbox/.gitignore +1 -0
aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +139 -24
aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +3 -1
aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +27 -2
aiq/tool/code_execution/register.py +7 -3
aiq/tool/code_execution/test_code_execution_sandbox.py +414 -0
aiq/tool/mcp/exceptions.py +142 -0
aiq/tool/mcp/mcp_client.py +41 -6
aiq/tool/mcp/mcp_tool.py +3 -2
aiq/tool/register.py +1 -0
aiq/tool/server_tools.py +6 -3
aiq/utils/exception_handlers/automatic_retries.py +289 -0
aiq/utils/exception_handlers/mcp.py +211 -0
aiq/utils/io/model_processing.py +28 -0
aiq/utils/log_utils.py +37 -0
aiq/utils/string_utils.py +38 -0
aiq/utils/type_converter.py +18 -2
aiq/utils/type_utils.py +87 -0
{aiqtoolkit-1.2.0.dev0.dist-info → aiqtoolkit-1.2.0rc2.dist-info}/METADATA +53 -21
aiqtoolkit-1.2.0rc2.dist-info/RECORD +436 -0
{aiqtoolkit-1.2.0.dev0.dist-info → aiqtoolkit-1.2.0rc2.dist-info}/WHEEL +1 -1
{aiqtoolkit-1.2.0.dev0.dist-info → aiqtoolkit-1.2.0rc2.dist-info}/entry_points.txt +3 -0
aiq/front_ends/fastapi/websocket.py +0 -148
aiq/observability/async_otel_listener.py +0 -429
aiqtoolkit-1.2.0.dev0.dist-info/RECORD +0 -316
{aiqtoolkit-1.2.0.dev0.dist-info → aiqtoolkit-1.2.0rc2.dist-info}/licenses/LICENSE-3rd-party.txt +0 -0
{aiqtoolkit-1.2.0.dev0.dist-info → aiqtoolkit-1.2.0rc2.dist-info}/licenses/LICENSE.md +0 -0
{aiqtoolkit-1.2.0.dev0.dist-info → aiqtoolkit-1.2.0rc2.dist-info}/top_level.txt +0 -0

aiq/experimental/inference_time_scaling/editing/llm_as_a_judge_editor.py ADDED Viewed

@@ -0,0 +1,204 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import asyncio
+import logging
+import re
+from aiq.builder.builder import Builder
+from aiq.builder.framework_enum import LLMFrameworkEnum
+from aiq.cli.register_workflow import register_its_strategy
+from aiq.data_models.its_strategy import ITSStrategyBaseConfig
+from aiq.experimental.inference_time_scaling.models.editor_config import LLMAsAJudgeEditorConfig
+from aiq.experimental.inference_time_scaling.models.its_item import ITSItem
+from aiq.experimental.inference_time_scaling.models.stage_enums import PipelineTypeEnum
+from aiq.experimental.inference_time_scaling.models.stage_enums import StageTypeEnum
+from aiq.experimental.inference_time_scaling.models.strategy_base import StrategyBase
+from aiq.utils.io.model_processing import remove_r1_think_tags
+logger = logging.getLogger(__name__)
+class LLMAsAJudgeEditor(StrategyBase):
+    """
+    Given a list of PlanningItems, uses a feedback LLM to generate feedback on each plan
+    Then edits the plan based on feedback.
+    """
+    def __init__(self, config: ITSStrategyBaseConfig) -> None:
+        super().__init__(config)
+        self.feedback_llm = None
+        self.editing_llm = None
+    async def build_components(self, builder: Builder) -> None:
+        """
+        Build the components required for the editor.
+        """
+        # Get the feedback LLM
+        self.feedback_llm = await builder.get_llm(self.config.feedback_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
+        self.editing_llm = await builder.get_llm(self.config.editing_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
+    def supported_pipeline_types(self) -> [PipelineTypeEnum]:
+        return [PipelineTypeEnum.PLANNING]
+    def stage_type(self) -> StageTypeEnum:
+        return StageTypeEnum.EDITING
+    async def generate_feedback(self, llm, template, context: str, prompt: str, item: ITSItem) -> ITSItem:
+        """
+        Helper function to generate feedback for a given planning item using the provided prompt.
+        """
+        prompt = await template.ainvoke(
+            input={
+                "context": context,
+                "original_prompt": prompt,  # Original prompt used to generate the plans
+                "plan": item.plan,
+                "num_feedback": self.config.num_feedback
+            })
+        feedback_result = await llm.ainvoke(prompt.to_string())
+        if not feedback_result:
+            logger.warning(f"No feedback generated for plan: {item.plan}.")
+            return item
+        # Update the planning item with the generated feedback
+        cleaned = remove_r1_think_tags(
+            feedback_result.content if hasattr(feedback_result, 'content') else str(feedback_result))
+        # Feedback is the string following 'FEEDBACK:'. Use Regex to extract
+        cleaned = re.sub(r'(?i)^\s*FEEDBACK:\s*', '', cleaned).strip()
+        if not cleaned:
+            logger.warning(f"Feedback was empty for plan: {item.plan}.")
+            return item
+        item.feedback = cleaned  # Set the feedback in the ITSItem
+        return item
+    async def edit_plan(self, llm, template, context: str, prompt: str, item: ITSItem) -> ITSItem:
+        """
+        Helper function to edit a plan based on feedback using the provided prompt.
+        """
+        if not item.feedback:
+            logger.warning(f"No feedback available for plan: {item.plan}. Cannot edit.")
+            return item
+        prompt = await template.ainvoke(
+            input={
+                "context": context,
+                "original_prompt": prompt,  # Original prompt used to generate the plans
+                "plan": item.plan,
+                "feedback": item.feedback
+            })
+        editing_result = await llm.ainvoke(prompt.to_string())
+        if not editing_result:
+            logger.warning(f"No editing result generated for plan: {item.plan}.")
+            return item
+        # Update the planning item with the edited plan
+        cleaned = remove_r1_think_tags(
+            editing_result.content if hasattr(editing_result, 'content') else str(editing_result))
+        # Plan is the string following 'EDITED PLAN:'. Use Regex to extract
+        cleaned = re.sub(r'(?i)^\s*EDITED PLAN:\s*', '', cleaned).strip()
+        if not cleaned:
+            logger.warning(f"Edited plan was empty for plan: {item.plan}. Returning original.")
+            return item
+        # Update the plan in the PlanningItem
+        item.plan = cleaned
+        return item
+    async def ainvoke(self,
+                      items: list[ITSItem],
+                      original_prompt: str | None = None,
+                      agent_context: str | None = None,
+                      **kwargs) -> list[ITSItem]:
+        """
+        Edit the provided planning items using a feedback LLM.
+        """
+        from langchain_core.language_models import BaseChatModel
+        from langchain_core.prompts import PromptTemplate
+        # assert self.config.feedback_llm is a BaseChatModel
+        if not isinstance(self.feedback_llm, BaseChatModel):
+            raise ValueError("The `feedback_llm` must be an instance of `BaseChatModel`.")
+        # assert self.config.editing_llm is a BaseChatModel
+        if not isinstance(self.editing_llm, BaseChatModel):
+            raise ValueError("The `editing_llm` must be an instance of `BaseChatModel`.")
+        feedback_model: BaseChatModel = self.feedback_llm
+        editing_model: BaseChatModel = self.editing_llm
+        feedback_template = PromptTemplate(template=self.config.feedback_template,
+                                           input_variables=["context", "original_prompt", "plan", "num_feedback"],
+                                           validate_template=True)
+        editing_template = PromptTemplate(template=self.config.editor_template,
+                                          input_variables=["context", "original_prompt", "plan", "feedback"],
+                                          validate_template=True)
+        # Generate feedback for each planning item concurrently
+        feedback_tasks = [
+            self.generate_feedback(
+                llm=feedback_model,
+                template=feedback_template,
+                context=agent_context,
+                prompt=original_prompt,  # Original prompt used to generate the plans
+                item=item) for item in items
+        ]
+        # Run the feedback tasks concurrently and gather results
+        planning_items_with_feedback = await asyncio.gather(*feedback_tasks)
+        if not planning_items_with_feedback:
+            raise ValueError("No feedback was generated for the planning items. Please check the LLM response.")
+        logger.info("Generated feedback for %d plans.", len(planning_items_with_feedback))
+        # Now edit each planning item based on the feedback concurrently
+        editing_tasks = [
+            self.edit_plan(
+                llm=editing_model,
+                template=editing_template,
+                context=agent_context,
+                prompt=original_prompt,  # Original prompt used to generate the plans
+                item=item) for item in planning_items_with_feedback
+        ]
+        # Run the editing tasks concurrently and gather results
+        edited_planning_items = await asyncio.gather(*editing_tasks)
+        if not edited_planning_items:
+            raise ValueError("No plans were edited. Please check the LLM response.")
+        logger.info("Edited %d plans based on feedback.", len(edited_planning_items))
+        return edited_planning_items
+@register_its_strategy(config_type=LLMAsAJudgeEditorConfig)
+async def register_llm_as_a_judge_editor(config: ITSStrategyBaseConfig, builder: Builder):
+    """
+    Register the LLMAsAJudgeEditor strategy with the provided configuration and builder.
+    """
+    editor = LLMAsAJudgeEditor(config)
+    await editor.build_components(builder)
+    yield editor

aiq/experimental/inference_time_scaling/editing/motivation_aware_summarization.py ADDED Viewed

@@ -0,0 +1,107 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import logging
+from aiq.builder.builder import Builder
+from aiq.builder.framework_enum import LLMFrameworkEnum
+from aiq.cli.register_workflow import register_its_strategy
+from aiq.experimental.inference_time_scaling.models.editor_config import MotivationAwareSummarizationConfig
+from aiq.experimental.inference_time_scaling.models.its_item import ITSItem
+from aiq.experimental.inference_time_scaling.models.stage_enums import PipelineTypeEnum
+from aiq.experimental.inference_time_scaling.models.stage_enums import StageTypeEnum
+from aiq.experimental.inference_time_scaling.models.strategy_base import StrategyBase
+from aiq.utils.io.model_processing import remove_r1_think_tags
+logger = logging.getLogger(__name__)
+class MotivationAwareSummarization(StrategyBase):
+    """
+    A strategy that, for each incoming ITSItem, summarizes the output based on input
+    and motivation.
+    """
+    def __init__(self, config: MotivationAwareSummarizationConfig) -> None:
+        super().__init__(config)
+        self.config = config
+        self.llm_bound = None
+    async def build_components(self, builder: Builder) -> None:
+        """
+        Binds each LLMRef in self.config.llms to an actual LLM client.
+        """
+        bound_llm = await builder.get_llm(self.config.editor_llm, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
+        self.llm_bound = bound_llm
+    def supported_pipeline_types(self) -> list[PipelineTypeEnum]:
+        return [PipelineTypeEnum.TOOL_USE]
+    def stage_type(self) -> StageTypeEnum:
+        return StageTypeEnum.EDITING
+    async def ainvoke(self,
+                      items: list[ITSItem],
+                      original_prompt: str | None = None,
+                      agent_context: str | None = None,
+                      **kwargs) -> list[ITSItem]:
+        """
+        For each ITSItem, rewrite the 'input' using each LLM to create a new perspective.
+        The new ITSItems' 'output' field will store the newly generated query.
+        """
+        try:
+            from langchain_core.prompts import PromptTemplate
+        except ImportError:
+            raise ImportError("langchain-core is required for MultiQueryRetrievalSearch. "
+                              "Install aiqtoolkit-langchain or similar.")
+        new_its_items: list[ITSItem] = []
+        # Create a single PromptTemplate object for rewriting the query
+        template_vars = ["task", "motivation", "output"]
+        query_template = PromptTemplate(template=self.config.editor_template,
+                                        input_variables=template_vars,
+                                        validate_template=True)
+        for item in items:
+            original_task = str(item.input) or ""
+            motivation = str(item.metadata) if item.metadata else ""
+            output = str(item.output) if item.output else ""
+            prompt = await (query_template.ainvoke(input={
+                "task": original_task, "motivation": motivation, "output": output
+            }))
+            llm_response = await self.llm_bound.ainvoke(prompt.to_string())
+            llm_response = remove_r1_think_tags(llm_response.content)
+            logger.info("LLM response from summarization: %s", llm_response)
+            new_its_items.append(
+                ITSItem(
+                    input=item.input,
+                    output=remove_r1_think_tags(llm_response),
+                    metadata=item.metadata,
+                    name=item.name,  # keep the original tool name
+                ))
+        return new_its_items
+@register_its_strategy(config_type=MotivationAwareSummarizationConfig)
+async def register_multi_query_retrieval_search(config: MotivationAwareSummarizationConfig, builder: Builder):
+    strategy = MotivationAwareSummarization(config)
+    await strategy.build_components(builder)
+    yield strategy

aiq/experimental/inference_time_scaling/functions/__init__.py ADDED Viewed

File without changes

aiq/experimental/inference_time_scaling/functions/execute_score_select_function.py ADDED Viewed

@@ -0,0 +1,105 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import logging
+from pydantic import Field
+from aiq.builder.builder import Builder
+from aiq.builder.function import Function
+from aiq.builder.function_info import FunctionInfo
+from aiq.cli.register_workflow import register_function
+from aiq.data_models.component_ref import FunctionRef
+from aiq.data_models.component_ref import ITSStrategyRef
+from aiq.data_models.function import FunctionBaseConfig
+from aiq.experimental.inference_time_scaling.models.its_item import ITSItem
+from aiq.experimental.inference_time_scaling.models.stage_enums import PipelineTypeEnum
+from aiq.experimental.inference_time_scaling.models.stage_enums import StageTypeEnum
+logger = logging.getLogger(__name__)
+class ExecuteScoreSelectFunctionConfig(FunctionBaseConfig, name="execute_score_select_function"):
+    scorer: ITSStrategyRef | None = Field(description="Strategy to score the output of the function", default=None)
+    selector: ITSStrategyRef = Field(description="Strategy to select the best output of the function")
+    augmented_fn: FunctionRef = Field(description="Function that will be executed")
+    num_executions: int = Field(3, description="Number of times to execute the function")
+@register_function(config_type=ExecuteScoreSelectFunctionConfig)
+async def execute_score_select_function(config: ExecuteScoreSelectFunctionConfig, builder: Builder):
+    import asyncio
+    import warnings
+    from pydantic import BaseModel
+    executable_fn: Function = builder.get_function(name=config.augmented_fn)
+    if config.scorer:
+        scorer = await builder.get_its_strategy(strategy_name=config.scorer,
+                                                pipeline_type=PipelineTypeEnum.AGENT_EXECUTION,
+                                                stage_type=StageTypeEnum.SCORING)
+    else:
+        scorer = None
+    selector = await builder.get_its_strategy(strategy_name=config.selector,
+                                              pipeline_type=PipelineTypeEnum.AGENT_EXECUTION,
+                                              stage_type=StageTypeEnum.SELECTION)
+    if executable_fn.has_streaming_output:
+        warnings.warn("Streaming output is not supported for this function. "
+                      "The function will be executed in non-streaming mode.")
+    def convert_to_str(arg):
+        if isinstance(arg, BaseModel):
+            return str(arg.model_dump())
+        return str(arg)
+    async def execute_fn(input_msg: executable_fn.input_type) -> executable_fn.single_output_type:
+        logger.info("Executing function %d times", config.num_executions)
+        tasks = [executable_fn.ainvoke(input_msg) for _ in range(config.num_executions)]
+        results = await asyncio.gather(*tasks)
+        input_str = convert_to_str(input_msg)
+        function_outputs = [convert_to_str(out) for out in results]
+        its_items = [ITSItem(
+            input=input_str,
+            output=out,
+        ) for out in function_outputs]
+        if scorer:
+            logger.info("Beginning scoring")
+            its_items = await scorer.ainvoke(items=its_items)
+        logger.info("Beginning selection")
+        selected_item = (await selector.ainvoke(items=its_items, original_prompt=its_items[0].input))[0]
+        # Find the index of selected item in its_items by matching the output
+        selected_output = selected_item.output
+        selected_index = -1
+        for i, item in enumerate(its_items):
+            if item.output == selected_output:
+                selected_index = i
+                break
+        return results[selected_index] if selected_index != -1 else selected_output
+    yield FunctionInfo.from_fn(
+        fn=execute_fn,
+        description=("This function executes a given function multiple times, scores the outputs, "
+                     "and selects the best output based on the specified scoring and selection strategies."),
+    )

aiq/experimental/inference_time_scaling/functions/its_tool_orchestration_function.py ADDED Viewed

@@ -0,0 +1,205 @@
+# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import asyncio
+import logging
+from pydantic import Field
+from aiq.builder.builder import Builder
+from aiq.builder.framework_enum import LLMFrameworkEnum
+from aiq.builder.function_info import FunctionInfo
+from aiq.cli.register_workflow import register_function
+from aiq.data_models.component_ref import FunctionRef
+from aiq.data_models.component_ref import ITSStrategyRef
+from aiq.data_models.function import FunctionBaseConfig
+from aiq.experimental.inference_time_scaling.models.its_item import ITSItem
+from aiq.experimental.inference_time_scaling.models.stage_enums import PipelineTypeEnum
+from aiq.experimental.inference_time_scaling.models.stage_enums import StageTypeEnum
+from aiq.experimental.inference_time_scaling.models.tool_use_config import ToolUseInputSchema
+from aiq.experimental.inference_time_scaling.models.tool_use_config import ToolUselist
+# Module-level logger, named after this module's import path via __name__.
+logger = logging.getLogger(__name__)
+class ITSToolOrchestrationFunctionConfig(FunctionBaseConfig, name="its_tool_orchestration"):
+    """
+    Configuration for the ITSToolOrchestrationFunction, which is used to orchestrate multiple functions.
+    """
+    augmented_fns: list[FunctionRef] = Field(
+        description="list of FunctionRefs for the functions to be orchestrated. Must be wrapped in `its_tool_wrapper`.")
+    search_strategy: ITSStrategyRef | None = Field(
+        description="The ITS search strategy to use for orchestrating invocation of the functions."
+        " If None, no search will be performed.",
+        default=None,
+    )
+    editing_strategy: ITSStrategyRef | None = Field(
+        default=None,
+        description="The ITS editing strategy to use for orchestrating invocation of the functions. "
+        "If None, no editing will be performed.",
+    )
+    scoring_strategy: ITSStrategyRef | None = Field(
+        default=None,
+        description="The ITS scoring strategy to use for orchestrating invocation of the functions. "
+        "If None, no scoring will be performed.",
+    )
+    selection_strategy: ITSStrategyRef = Field(
+        description="The ITS selection strategy to use for orchestrating invocation of the functions.")
+@register_function(config_type=ITSToolOrchestrationFunctionConfig, framework_wrappers=[LLMFrameworkEnum.LANGCHAIN])
+async def register_its_tool_orchestration_function(
+    config: ITSToolOrchestrationFunctionConfig,
+    builder: Builder,
+):
+    """
+    Registers an ITS-based orchestration function that:
+     1. Instantiates all relevant strategies (search, editing, scoring, selection).
+     2. Accepts a ToolUselist, converts each item to an ITSItem, optionally runs search/editing.
+     3. Calls the correct augmented_fn per item using name=tool name.
+     4. If configured, runs scoring and selection on the result.
+     5. Returns a new ToolUselist with each output set.
+    """
+    # 1) Gather references to all augmented (wrapped) functions
+    function_map = {}
+    for fn_ref in config.augmented_fns:
+        # Retrieve the actual function from the builder
+        fn_obj = builder.get_function(fn_ref)
+        function_map[fn_ref] = fn_obj
+    # 2) Instantiate search, editing, scoring, selection strategies (if any)
+    search = None
+    if config.search_strategy is not None:
+        search = await builder.get_its_strategy(
+            strategy_name=config.search_strategy,
+            pipeline_type=PipelineTypeEnum.TOOL_USE,
+            stage_type=StageTypeEnum.SEARCH,
+        )
+    editing = None
+    if config.editing_strategy is not None:
+        editing = await builder.get_its_strategy(
+            strategy_name=config.editing_strategy,
+            pipeline_type=PipelineTypeEnum.TOOL_USE,
+            stage_type=StageTypeEnum.EDITING,
+        )
+    scoring = None
+    if config.scoring_strategy is not None:
+        scoring = await builder.get_its_strategy(
+            strategy_name=config.scoring_strategy,
+            pipeline_type=PipelineTypeEnum.TOOL_USE,
+            stage_type=StageTypeEnum.SCORING,
+        )
+    selection = await builder.get_its_strategy(
+        strategy_name=config.selection_strategy,
+        pipeline_type=PipelineTypeEnum.TOOL_USE,
+        stage_type=StageTypeEnum.SELECTION,
+    )
+    fn_description = ("\n".join(f"- **{fn_ref}**: {function_map[fn_ref].description or 'No description provided.'}"
+                                for fn_ref in config.augmented_fns))
+    # 3) Create the inner function to handle single (non-streaming) calls.
+    async def single_inner(tool_list: ToolUselist) -> ToolUselist:
+        """
+        Orchestrates multiple tool usages, optionally using search/editing/scoring/selection steps.
+        """
+        # Convert each ToolUseInputSchema to ITSItem
+        its_items = []
+        for t in tool_list.tools:
+            item = ITSItem(
+                input=t.task_description,  # The user "task"
+                output=None,
+                name=t.tool_name,  # The "tool name"
+                metadata=t.motivation,  # The "justification"
+            )
+            its_items.append(item)
+        # Run search strategy if present
+        if search is not None:
+            its_items = await search.ainvoke(its_items)
+        logger.info("ITS orchestration function: %d items after search", len(its_items))
+        # Invoke the correct augmented function for each item concurrently
+        # Helper coroutine to invoke a tool function and capture result or error
+        async def _invoke_tool(item: ITSItem, fn):
+            try:
+                result = await fn.acall_invoke(item.output)
+                return item, result, None
+            except Exception as e:
+                logger.error(f"Error invoking function '{item.name}': {e}")
+                return item, None, str(e)
+        tasks = []
+        for item in its_items:
+            if item.name not in function_map:
+                logger.error(f"Function '{item.name}' not found in function map.")
+                item.output = f"Error: Function '{item.name}' not found in function map. Check your input"
+            else:
+                fn = function_map[item.name]
+                tasks.append(_invoke_tool(item, fn))
+        # Await all tasks and assign outputs
+        if tasks:
+            results = await asyncio.gather(*tasks)
+            for item, result, error in results:
+                if error:
+                    item.output = f"Error invoking function '{item.name}': {error}"
+                else:
+                    item.output = result
+        if editing:
+            its_items = await editing.ainvoke(its_items)
+        # Run scoring strategy if present
+        if scoring is not None:
+            its_items = await scoring.ainvoke(its_items)
+        # Run selection strategy
+        if selection is not None:
+            its_items = await selection.ainvoke(its_items)
+        logger.info("ITS orchestration function: %d items after selection", len(its_items))
+        # Convert final results from ITSItems back to a ToolUselist
+        final_list = ToolUselist(tools=[])
+        for item in its_items:
+            # Compose a new ToolUseInputSchema with final output
+            new_tool = ToolUseInputSchema(
+                tool_name=item.name,
+                task_description=str(item.input),
+                motivation=item.metadata if item.metadata else None,
+                output=str(item.output) if item.output is not None else None,
+            )
+            final_list.tools.append(new_tool)
+        return final_list
+    # 4) Return the function info (only a single_fn is needed; no streaming)
+    yield FunctionInfo.create(
+        single_fn=single_inner,
+        stream_fn=None,  # No streaming required
+        input_schema=ToolUselist,
+        single_output_schema=ToolUselist,
+        description=fn_description)

aiqtoolkit 1.2.0.dev0__py3-none-any.whl → 1.2.0rc2__py3-none-any.whl

Potentially problematic release.

aiqtoolkit 1.2.0.dev0__py3-none-any.whl → 1.2.0rc2__py3-none-any.whl