aiqtoolkit-1.1.0rc6-py3-none-any.whl → aiqtoolkit-1.2.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of aiqtoolkit might be problematic.

Files changed (319)
  1. aiqtoolkit-1.2.0.dist-info/METADATA +29 -0
  2. aiqtoolkit-1.2.0.dist-info/RECORD +4 -0
  3. {aiqtoolkit-1.1.0rc6.dist-info → aiqtoolkit-1.2.0.dist-info}/WHEEL +1 -1
  4. aiqtoolkit-1.2.0.dist-info/top_level.txt +1 -0
  5. aiq/agent/__init__.py +0 -0
  6. aiq/agent/base.py +0 -76
  7. aiq/agent/dual_node.py +0 -67
  8. aiq/agent/react_agent/__init__.py +0 -0
  9. aiq/agent/react_agent/agent.py +0 -322
  10. aiq/agent/react_agent/output_parser.py +0 -104
  11. aiq/agent/react_agent/prompt.py +0 -46
  12. aiq/agent/react_agent/register.py +0 -148
  13. aiq/agent/reasoning_agent/__init__.py +0 -0
  14. aiq/agent/reasoning_agent/reasoning_agent.py +0 -224
  15. aiq/agent/register.py +0 -23
  16. aiq/agent/rewoo_agent/__init__.py +0 -0
  17. aiq/agent/rewoo_agent/agent.py +0 -410
  18. aiq/agent/rewoo_agent/prompt.py +0 -108
  19. aiq/agent/rewoo_agent/register.py +0 -158
  20. aiq/agent/tool_calling_agent/__init__.py +0 -0
  21. aiq/agent/tool_calling_agent/agent.py +0 -123
  22. aiq/agent/tool_calling_agent/register.py +0 -105
  23. aiq/builder/__init__.py +0 -0
  24. aiq/builder/builder.py +0 -223
  25. aiq/builder/component_utils.py +0 -303
  26. aiq/builder/context.py +0 -227
  27. aiq/builder/embedder.py +0 -24
  28. aiq/builder/eval_builder.py +0 -120
  29. aiq/builder/evaluator.py +0 -29
  30. aiq/builder/framework_enum.py +0 -24
  31. aiq/builder/front_end.py +0 -73
  32. aiq/builder/function.py +0 -297
  33. aiq/builder/function_base.py +0 -376
  34. aiq/builder/function_info.py +0 -627
  35. aiq/builder/intermediate_step_manager.py +0 -176
  36. aiq/builder/llm.py +0 -25
  37. aiq/builder/retriever.py +0 -25
  38. aiq/builder/user_interaction_manager.py +0 -71
  39. aiq/builder/workflow.py +0 -143
  40. aiq/builder/workflow_builder.py +0 -757
  41. aiq/cli/__init__.py +0 -14
  42. aiq/cli/cli_utils/__init__.py +0 -0
  43. aiq/cli/cli_utils/config_override.py +0 -231
  44. aiq/cli/cli_utils/validation.py +0 -37
  45. aiq/cli/commands/__init__.py +0 -0
  46. aiq/cli/commands/configure/__init__.py +0 -0
  47. aiq/cli/commands/configure/channel/__init__.py +0 -0
  48. aiq/cli/commands/configure/channel/add.py +0 -28
  49. aiq/cli/commands/configure/channel/channel.py +0 -36
  50. aiq/cli/commands/configure/channel/remove.py +0 -30
  51. aiq/cli/commands/configure/channel/update.py +0 -30
  52. aiq/cli/commands/configure/configure.py +0 -33
  53. aiq/cli/commands/evaluate.py +0 -139
  54. aiq/cli/commands/info/__init__.py +0 -14
  55. aiq/cli/commands/info/info.py +0 -39
  56. aiq/cli/commands/info/list_channels.py +0 -32
  57. aiq/cli/commands/info/list_components.py +0 -129
  58. aiq/cli/commands/info/list_mcp.py +0 -126
  59. aiq/cli/commands/registry/__init__.py +0 -14
  60. aiq/cli/commands/registry/publish.py +0 -88
  61. aiq/cli/commands/registry/pull.py +0 -118
  62. aiq/cli/commands/registry/registry.py +0 -38
  63. aiq/cli/commands/registry/remove.py +0 -108
  64. aiq/cli/commands/registry/search.py +0 -155
  65. aiq/cli/commands/start.py +0 -250
  66. aiq/cli/commands/uninstall.py +0 -83
  67. aiq/cli/commands/validate.py +0 -47
  68. aiq/cli/commands/workflow/__init__.py +0 -14
  69. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  70. aiq/cli/commands/workflow/templates/config.yml.j2 +0 -16
  71. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +0 -22
  72. aiq/cli/commands/workflow/templates/register.py.j2 +0 -5
  73. aiq/cli/commands/workflow/templates/workflow.py.j2 +0 -36
  74. aiq/cli/commands/workflow/workflow.py +0 -37
  75. aiq/cli/commands/workflow/workflow_commands.py +0 -313
  76. aiq/cli/entrypoint.py +0 -133
  77. aiq/cli/main.py +0 -44
  78. aiq/cli/register_workflow.py +0 -408
  79. aiq/cli/type_registry.py +0 -879
  80. aiq/data_models/__init__.py +0 -14
  81. aiq/data_models/api_server.py +0 -588
  82. aiq/data_models/common.py +0 -143
  83. aiq/data_models/component.py +0 -46
  84. aiq/data_models/component_ref.py +0 -135
  85. aiq/data_models/config.py +0 -349
  86. aiq/data_models/dataset_handler.py +0 -122
  87. aiq/data_models/discovery_metadata.py +0 -286
  88. aiq/data_models/embedder.py +0 -26
  89. aiq/data_models/evaluate.py +0 -104
  90. aiq/data_models/evaluator.py +0 -26
  91. aiq/data_models/front_end.py +0 -26
  92. aiq/data_models/function.py +0 -30
  93. aiq/data_models/function_dependencies.py +0 -64
  94. aiq/data_models/interactive.py +0 -237
  95. aiq/data_models/intermediate_step.py +0 -269
  96. aiq/data_models/invocation_node.py +0 -38
  97. aiq/data_models/llm.py +0 -26
  98. aiq/data_models/logging.py +0 -26
  99. aiq/data_models/memory.py +0 -26
  100. aiq/data_models/profiler.py +0 -53
  101. aiq/data_models/registry_handler.py +0 -26
  102. aiq/data_models/retriever.py +0 -30
  103. aiq/data_models/step_adaptor.py +0 -64
  104. aiq/data_models/streaming.py +0 -33
  105. aiq/data_models/swe_bench_model.py +0 -54
  106. aiq/data_models/telemetry_exporter.py +0 -26
  107. aiq/embedder/__init__.py +0 -0
  108. aiq/embedder/langchain_client.py +0 -41
  109. aiq/embedder/nim_embedder.py +0 -58
  110. aiq/embedder/openai_embedder.py +0 -42
  111. aiq/embedder/register.py +0 -24
  112. aiq/eval/__init__.py +0 -14
  113. aiq/eval/config.py +0 -42
  114. aiq/eval/dataset_handler/__init__.py +0 -0
  115. aiq/eval/dataset_handler/dataset_downloader.py +0 -106
  116. aiq/eval/dataset_handler/dataset_filter.py +0 -52
  117. aiq/eval/dataset_handler/dataset_handler.py +0 -169
  118. aiq/eval/evaluate.py +0 -325
  119. aiq/eval/evaluator/__init__.py +0 -14
  120. aiq/eval/evaluator/evaluator_model.py +0 -44
  121. aiq/eval/intermediate_step_adapter.py +0 -93
  122. aiq/eval/rag_evaluator/__init__.py +0 -0
  123. aiq/eval/rag_evaluator/evaluate.py +0 -138
  124. aiq/eval/rag_evaluator/register.py +0 -138
  125. aiq/eval/register.py +0 -23
  126. aiq/eval/remote_workflow.py +0 -128
  127. aiq/eval/runtime_event_subscriber.py +0 -52
  128. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  129. aiq/eval/swe_bench_evaluator/evaluate.py +0 -215
  130. aiq/eval/swe_bench_evaluator/register.py +0 -36
  131. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  132. aiq/eval/trajectory_evaluator/evaluate.py +0 -118
  133. aiq/eval/trajectory_evaluator/register.py +0 -40
  134. aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
  135. aiq/eval/tunable_rag_evaluator/evaluate.py +0 -263
  136. aiq/eval/tunable_rag_evaluator/register.py +0 -50
  137. aiq/eval/utils/__init__.py +0 -0
  138. aiq/eval/utils/output_uploader.py +0 -131
  139. aiq/eval/utils/tqdm_position_registry.py +0 -40
  140. aiq/front_ends/__init__.py +0 -14
  141. aiq/front_ends/console/__init__.py +0 -14
  142. aiq/front_ends/console/console_front_end_config.py +0 -32
  143. aiq/front_ends/console/console_front_end_plugin.py +0 -107
  144. aiq/front_ends/console/register.py +0 -25
  145. aiq/front_ends/cron/__init__.py +0 -14
  146. aiq/front_ends/fastapi/__init__.py +0 -14
  147. aiq/front_ends/fastapi/fastapi_front_end_config.py +0 -150
  148. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +0 -103
  149. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +0 -607
  150. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +0 -80
  151. aiq/front_ends/fastapi/job_store.py +0 -161
  152. aiq/front_ends/fastapi/main.py +0 -70
  153. aiq/front_ends/fastapi/message_handler.py +0 -279
  154. aiq/front_ends/fastapi/message_validator.py +0 -345
  155. aiq/front_ends/fastapi/register.py +0 -25
  156. aiq/front_ends/fastapi/response_helpers.py +0 -195
  157. aiq/front_ends/fastapi/step_adaptor.py +0 -320
  158. aiq/front_ends/fastapi/websocket.py +0 -148
  159. aiq/front_ends/mcp/__init__.py +0 -14
  160. aiq/front_ends/mcp/mcp_front_end_config.py +0 -32
  161. aiq/front_ends/mcp/mcp_front_end_plugin.py +0 -93
  162. aiq/front_ends/mcp/register.py +0 -27
  163. aiq/front_ends/mcp/tool_converter.py +0 -242
  164. aiq/front_ends/register.py +0 -22
  165. aiq/front_ends/simple_base/__init__.py +0 -14
  166. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +0 -52
  167. aiq/llm/__init__.py +0 -0
  168. aiq/llm/nim_llm.py +0 -45
  169. aiq/llm/openai_llm.py +0 -45
  170. aiq/llm/register.py +0 -22
  171. aiq/llm/utils/__init__.py +0 -14
  172. aiq/llm/utils/env_config_value.py +0 -94
  173. aiq/llm/utils/error.py +0 -17
  174. aiq/memory/__init__.py +0 -20
  175. aiq/memory/interfaces.py +0 -183
  176. aiq/memory/models.py +0 -112
  177. aiq/meta/module_to_distro.json +0 -3
  178. aiq/meta/pypi.md +0 -58
  179. aiq/observability/__init__.py +0 -0
  180. aiq/observability/async_otel_listener.py +0 -429
  181. aiq/observability/register.py +0 -99
  182. aiq/plugins/.namespace +0 -1
  183. aiq/profiler/__init__.py +0 -0
  184. aiq/profiler/callbacks/__init__.py +0 -0
  185. aiq/profiler/callbacks/agno_callback_handler.py +0 -295
  186. aiq/profiler/callbacks/base_callback_class.py +0 -20
  187. aiq/profiler/callbacks/langchain_callback_handler.py +0 -278
  188. aiq/profiler/callbacks/llama_index_callback_handler.py +0 -205
  189. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +0 -238
  190. aiq/profiler/callbacks/token_usage_base_model.py +0 -27
  191. aiq/profiler/data_frame_row.py +0 -51
  192. aiq/profiler/decorators/__init__.py +0 -0
  193. aiq/profiler/decorators/framework_wrapper.py +0 -131
  194. aiq/profiler/decorators/function_tracking.py +0 -254
  195. aiq/profiler/forecasting/__init__.py +0 -0
  196. aiq/profiler/forecasting/config.py +0 -18
  197. aiq/profiler/forecasting/model_trainer.py +0 -75
  198. aiq/profiler/forecasting/models/__init__.py +0 -22
  199. aiq/profiler/forecasting/models/forecasting_base_model.py +0 -40
  200. aiq/profiler/forecasting/models/linear_model.py +0 -196
  201. aiq/profiler/forecasting/models/random_forest_regressor.py +0 -268
  202. aiq/profiler/inference_metrics_model.py +0 -25
  203. aiq/profiler/inference_optimization/__init__.py +0 -0
  204. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  205. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +0 -452
  206. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +0 -258
  207. aiq/profiler/inference_optimization/data_models.py +0 -386
  208. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  209. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +0 -468
  210. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +0 -405
  211. aiq/profiler/inference_optimization/llm_metrics.py +0 -212
  212. aiq/profiler/inference_optimization/prompt_caching.py +0 -163
  213. aiq/profiler/inference_optimization/token_uniqueness.py +0 -107
  214. aiq/profiler/inference_optimization/workflow_runtimes.py +0 -72
  215. aiq/profiler/intermediate_property_adapter.py +0 -102
  216. aiq/profiler/profile_runner.py +0 -433
  217. aiq/profiler/utils.py +0 -184
  218. aiq/registry_handlers/__init__.py +0 -0
  219. aiq/registry_handlers/local/__init__.py +0 -0
  220. aiq/registry_handlers/local/local_handler.py +0 -176
  221. aiq/registry_handlers/local/register_local.py +0 -37
  222. aiq/registry_handlers/metadata_factory.py +0 -60
  223. aiq/registry_handlers/package_utils.py +0 -198
  224. aiq/registry_handlers/pypi/__init__.py +0 -0
  225. aiq/registry_handlers/pypi/pypi_handler.py +0 -251
  226. aiq/registry_handlers/pypi/register_pypi.py +0 -40
  227. aiq/registry_handlers/register.py +0 -21
  228. aiq/registry_handlers/registry_handler_base.py +0 -157
  229. aiq/registry_handlers/rest/__init__.py +0 -0
  230. aiq/registry_handlers/rest/register_rest.py +0 -56
  231. aiq/registry_handlers/rest/rest_handler.py +0 -237
  232. aiq/registry_handlers/schemas/__init__.py +0 -0
  233. aiq/registry_handlers/schemas/headers.py +0 -42
  234. aiq/registry_handlers/schemas/package.py +0 -68
  235. aiq/registry_handlers/schemas/publish.py +0 -63
  236. aiq/registry_handlers/schemas/pull.py +0 -82
  237. aiq/registry_handlers/schemas/remove.py +0 -36
  238. aiq/registry_handlers/schemas/search.py +0 -91
  239. aiq/registry_handlers/schemas/status.py +0 -47
  240. aiq/retriever/__init__.py +0 -0
  241. aiq/retriever/interface.py +0 -37
  242. aiq/retriever/milvus/__init__.py +0 -14
  243. aiq/retriever/milvus/register.py +0 -81
  244. aiq/retriever/milvus/retriever.py +0 -228
  245. aiq/retriever/models.py +0 -74
  246. aiq/retriever/nemo_retriever/__init__.py +0 -14
  247. aiq/retriever/nemo_retriever/register.py +0 -60
  248. aiq/retriever/nemo_retriever/retriever.py +0 -190
  249. aiq/retriever/register.py +0 -22
  250. aiq/runtime/__init__.py +0 -14
  251. aiq/runtime/loader.py +0 -188
  252. aiq/runtime/runner.py +0 -176
  253. aiq/runtime/session.py +0 -140
  254. aiq/runtime/user_metadata.py +0 -131
  255. aiq/settings/__init__.py +0 -0
  256. aiq/settings/global_settings.py +0 -318
  257. aiq/test/.namespace +0 -1
  258. aiq/tool/__init__.py +0 -0
  259. aiq/tool/code_execution/__init__.py +0 -0
  260. aiq/tool/code_execution/code_sandbox.py +0 -188
  261. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +0 -60
  262. aiq/tool/code_execution/local_sandbox/__init__.py +0 -13
  263. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +0 -83
  264. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +0 -4
  265. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +0 -25
  266. aiq/tool/code_execution/register.py +0 -70
  267. aiq/tool/code_execution/utils.py +0 -100
  268. aiq/tool/datetime_tools.py +0 -42
  269. aiq/tool/document_search.py +0 -141
  270. aiq/tool/github_tools/__init__.py +0 -0
  271. aiq/tool/github_tools/create_github_commit.py +0 -133
  272. aiq/tool/github_tools/create_github_issue.py +0 -87
  273. aiq/tool/github_tools/create_github_pr.py +0 -106
  274. aiq/tool/github_tools/get_github_file.py +0 -106
  275. aiq/tool/github_tools/get_github_issue.py +0 -166
  276. aiq/tool/github_tools/get_github_pr.py +0 -256
  277. aiq/tool/github_tools/update_github_issue.py +0 -100
  278. aiq/tool/mcp/__init__.py +0 -14
  279. aiq/tool/mcp/mcp_client.py +0 -220
  280. aiq/tool/mcp/mcp_tool.py +0 -95
  281. aiq/tool/memory_tools/__init__.py +0 -0
  282. aiq/tool/memory_tools/add_memory_tool.py +0 -79
  283. aiq/tool/memory_tools/delete_memory_tool.py +0 -67
  284. aiq/tool/memory_tools/get_memory_tool.py +0 -72
  285. aiq/tool/nvidia_rag.py +0 -95
  286. aiq/tool/register.py +0 -37
  287. aiq/tool/retriever.py +0 -89
  288. aiq/tool/server_tools.py +0 -63
  289. aiq/utils/__init__.py +0 -0
  290. aiq/utils/data_models/__init__.py +0 -0
  291. aiq/utils/data_models/schema_validator.py +0 -58
  292. aiq/utils/debugging_utils.py +0 -43
  293. aiq/utils/exception_handlers/__init__.py +0 -0
  294. aiq/utils/exception_handlers/schemas.py +0 -114
  295. aiq/utils/io/__init__.py +0 -0
  296. aiq/utils/io/yaml_tools.py +0 -119
  297. aiq/utils/metadata_utils.py +0 -74
  298. aiq/utils/optional_imports.py +0 -142
  299. aiq/utils/producer_consumer_queue.py +0 -178
  300. aiq/utils/reactive/__init__.py +0 -0
  301. aiq/utils/reactive/base/__init__.py +0 -0
  302. aiq/utils/reactive/base/observable_base.py +0 -65
  303. aiq/utils/reactive/base/observer_base.py +0 -55
  304. aiq/utils/reactive/base/subject_base.py +0 -79
  305. aiq/utils/reactive/observable.py +0 -59
  306. aiq/utils/reactive/observer.py +0 -76
  307. aiq/utils/reactive/subject.py +0 -131
  308. aiq/utils/reactive/subscription.py +0 -49
  309. aiq/utils/settings/__init__.py +0 -0
  310. aiq/utils/settings/global_settings.py +0 -197
  311. aiq/utils/type_converter.py +0 -232
  312. aiq/utils/type_utils.py +0 -397
  313. aiq/utils/url_utils.py +0 -27
  314. aiqtoolkit-1.1.0rc6.dist-info/METADATA +0 -331
  315. aiqtoolkit-1.1.0rc6.dist-info/RECORD +0 -316
  316. aiqtoolkit-1.1.0rc6.dist-info/entry_points.txt +0 -17
  317. aiqtoolkit-1.1.0rc6.dist-info/licenses/LICENSE-3rd-party.txt +0 -3686
  318. aiqtoolkit-1.1.0rc6.dist-info/licenses/LICENSE.md +0 -201
  319. aiqtoolkit-1.1.0rc6.dist-info/top_level.txt +0 -1
aiq/profiler/inference_optimization/prompt_caching.py
@@ -1,163 +0,0 @@
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
- # SPDX-License-Identifier: Apache-2.0
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
-
- from aiq.data_models.intermediate_step import IntermediateStep
- from aiq.profiler.inference_optimization.data_models import CommonPrefixesOutput
- from aiq.profiler.inference_optimization.data_models import FrameworkLLMPrefixData
- from aiq.profiler.inference_optimization.data_models import PrefixInfo
- from aiq.profiler.utils import create_standardized_dataframe
-
-
- # -----------------------------------------------------------
- # 1. Helper: Build a prefix trie
- # -----------------------------------------------------------
- def build_prefix_trie(strings: list[str]) -> dict:
-     """
-     Build a trie from a list of strings.
-
-     Returns a nested dictionary with::
-
-         {
-             'count': int,  # number of strings passing through this node
-             'children': dict[str, TrieNode]
-         }
-
-     """
-     root = {'count': 0, 'children': {}}
-     for s in strings:
-         node = root
-         node['count'] += 1  # every string passes through the root
-         for ch in s:
-             if ch not in node['children']:
-                 node['children'][ch] = {'count': 0, 'children': {}}
-             node = node['children'][ch]
-             node['count'] += 1
-     return root
-
-
- # -----------------------------------------------------------
- # 2. Helper: Iterative traversal of the trie
- # -----------------------------------------------------------
- def collect_prefixes_iterative(root: dict, total_calls: int) -> list[dict]:
-     """
-     Iteratively traverse the trie to collect prefix statistics,
-     avoiding recursion depth limits.
-
-     :param root: Trie node with 'count' and 'children'
-     :param total_calls: Number of total calls in this group (denominator for percentages)
-     :return: A list of dicts, each dict containing prefix info
-     """
-     results = []
-     # stack holds (node, prefix_so_far)
-     stack = [(root, "")]
-
-     while stack:
-         node, prefix = stack.pop()
-
-         # Skip storing the empty root prefix
-         if prefix:
-             calls_count = node['count']
-             calls_percentage = calls_count / total_calls
-             results.append({
-                 'prefix': prefix,
-                 'prefix_length': len(prefix),
-                 'calls_count': calls_count,
-                 'calls_percentage': calls_percentage
-             })
-
-         # Add children to the stack
-         for ch, child_node in node['children'].items():
-             stack.append((child_node, prefix + ch))
-
-     return results
-
-
- # -----------------------------------------------------------
- # 3. Main Function
- # -----------------------------------------------------------
- def get_common_prefixes(all_steps: list[list[IntermediateStep]],
-                         min_call_percentage: float = 0.0) -> CommonPrefixesOutput:
-     """
-     Build a standardized DataFrame (with columns 'framework', 'llm_name',
-     and 'llm_text_input') from the intermediate steps, then return a
-     Pydantic-validated RootModel keyed by "<llm_name>" with a sorted list of
-     common prefix statistics.
-
-     1) Only includes prefixes with calls_percentage >= `min_call_percentage`.
-     2) Excludes any prefix that is a substring of another (longer) prefix
-        that already meets the threshold and is retained.
-
-     :param all_steps: Intermediate steps
-     :param min_call_percentage: Exclude prefixes that appear in fewer than this fraction
-         of total calls. (Default 0.0 = no filtering)
-
-     Sorting: primarily by prefix length (descending),
-     secondarily by frequency (descending).
-     """
-     df = create_standardized_dataframe(all_steps)
-
-     # Validate necessary columns
-     required_cols = {'framework', 'llm_name', 'llm_text_input'}
-     if not required_cols.issubset(df.columns):
-         missing = required_cols - set(df.columns)
-         raise ValueError(f"DataFrame missing required columns: {missing}")
-
-     output_data: dict[str, FrameworkLLMPrefixData] = {}
-
-     # Group DataFrame by llm_name
-     grouped = df.groupby(['llm_name'])
-     for llm_name, group_df in grouped:
-         # Unpack the single-element llm_name tuple
-         llm_name = llm_name[0]
-
-         text_inputs = group_df['llm_text_input'].astype(str).tolist()
-         total_calls = len(text_inputs)
-
-         # Build trie for all text inputs
-         trie = build_prefix_trie(text_inputs)
-
-         # Collect prefix info using iterative traversal
-         results = collect_prefixes_iterative(trie, total_calls=total_calls)
-
-         # 1) Filter out prefixes below min_call_percentage
-         results_filtered = [r for r in results if r['calls_percentage'] >= min_call_percentage]
-
-         # 2) Sort results: prefix_length desc, then calls_count desc
-         results_sorted = sorted(results_filtered, key=lambda x: (x['prefix_length'], x['calls_count']), reverse=True)
-
-         # 3) Substring filtering:
-         #    Because results_sorted is in descending length order,
-         #    if we keep a prefix, we exclude any shorter prefix that
-         #    is a substring of that already-kept prefix.
-         final_results = []
-         for r in results_sorted:
-             pfx = r['prefix']
-             # Check if this prefix is contained in any longer prefix we have kept
-             if not any(pfx in kept['prefix'] for kept in final_results):
-                 final_results.append(r)
-
-         # Convert each dict to a PrefixInfo model
-         prefix_info_list = [PrefixInfo(**res) for res in final_results]
-
-         # Construct the dictionary key
-         framework_llm_key = f"{llm_name}"
-
-         # Save the data for this group
-         output_data[framework_llm_key] = FrameworkLLMPrefixData(total_calls=total_calls, prefix_info=prefix_info_list)
-
-     # Package the final result in a validated RootModel
-     result_model = CommonPrefixesOutput(root=output_data)
-     return result_model
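
The removed helpers are easiest to understand on a toy input. A minimal sketch, not part of the package: it assumes aiqtoolkit 1.1.0rc6 is installed (the last release that still ships aiq/profiler/inference_optimization/prompt_caching.py), and the prompt strings are invented for illustration.

    from aiq.profiler.inference_optimization.prompt_caching import build_prefix_trie
    from aiq.profiler.inference_optimization.prompt_caching import collect_prefixes_iterative

    # Two prompts that share a long system-prompt prefix (made-up examples)
    prompts = [
        "You are a helpful assistant. Summarize the report.",
        "You are a helpful assistant. Translate the report.",
    ]

    trie = build_prefix_trie(prompts)
    stats = collect_prefixes_iterative(trie, total_calls=len(prompts))

    # Prefixes seen in 100% of calls are prompt-caching candidates; the
    # longest of them is the shared system prompt.
    shared = [s for s in stats if s["calls_percentage"] == 1.0]
    longest = max(shared, key=lambda s: s["prefix_length"])
    print(longest["prefix"])  # "You are a helpful assistant. "
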
aiq/profiler/inference_optimization/token_uniqueness.py
@@ -1,107 +0,0 @@
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
- # SPDX-License-Identifier: Apache-2.0
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
-
- import re
-
- import numpy as np
-
- from aiq.data_models.intermediate_step import IntermediateStep
- from aiq.profiler.inference_optimization.data_models import LLMUniquenessMetrics
- from aiq.profiler.inference_optimization.data_models import LLMUniquenessMetricsByLLM
- from aiq.profiler.utils import create_standardized_dataframe
-
-
- # ----------------------------------------------------------------
- # 1. Main Function
- # ----------------------------------------------------------------
- def compute_inter_query_token_uniqueness_by_llm(all_steps: list[list[IntermediateStep]]) -> LLMUniquenessMetricsByLLM:
-     """
-     Computes p90, p95, and p99 of 'new words added' between consecutive llm_start events,
-     grouped by (llm_name, example_number).
-
-     Steps:
-
-     1. Filter df to only llm_start events.
-     2. Group first by (llm_name, example_number), then sort by event_timestamp in each group.
-     3. Compare each llm_text_input to the previous one in the same group to find how many new words appear.
-     4. Aggregate all 'new words count' across each llm_name, compute p90/p95/p99 for each LLM.
-     5. Return a Pydantic RootModel containing a dictionary::
-
-         { llm_name -> LLMUniquenessMetrics(p90, p95, p99) }.
-     """
-     df = create_standardized_dataframe(all_steps)
-     # Validate that the necessary columns exist
-     required_cols = {'event_type', 'llm_name', 'example_number', 'event_timestamp', 'llm_text_input'}
-     missing = required_cols - set(df.columns)
-     if missing:
-         raise ValueError(f"DataFrame missing required columns: {missing}")
-
-     # 1) Filter to llm_start events
-     cdf = df[df['event_type'] == 'LLM_START'].copy()
-     if cdf.empty:
-         # Return an empty dictionary if no llm_start events
-         return LLMUniquenessMetricsByLLM(root={})
-
-     # Helper to tokenize text into a set of words
-     def tokenize_to_set(text: str) -> set:
-         if not isinstance(text, str):
-             return set()
-         return set(re.findall(r"\w+", text.lower()))
-
-     # We'll store new_words counts for each llm_name
-     llm_to_counts: dict[str, list[int]] = {}
-
-     # 2) Group by (llm_name, example_number), then sort each group
-     grouped = cdf.groupby(['llm_name', 'example_number'], as_index=False, group_keys=True)
-
-     for (llm, ex_num), group_df in grouped:  # pylint: disable=unused-variable
-         # Sort by event_timestamp
-         group_df = group_df.sort_values('event_timestamp', ascending=True)
-
-         # Shift the llm_text_input to compare consecutive calls
-         group_df['prev_llm_text_input'] = group_df['llm_text_input'].shift(1)
-
-         # Compute new words for each row (excluding the first in the group)
-         def compute_new_words(row):
-             current_tokens = tokenize_to_set(row['llm_text_input'])
-             prev_tokens = tokenize_to_set(row['prev_llm_text_input'])
-             return len(current_tokens - prev_tokens)
-
-         group_df['new_words_count'] = group_df.apply(compute_new_words, axis=1)
-
-         # Drop rows where there's no 'previous' call
-         valid_rows = group_df.dropna(subset=['prev_llm_text_input'])
-
-         # Gather the new_words_count
-         counts = valid_rows['new_words_count'].tolist()
-         if counts:
-             # Accumulate them in llm_to_counts
-             if llm not in llm_to_counts:
-                 llm_to_counts[llm] = []
-             llm_to_counts[llm].extend(counts)
-
-     # 4) For each llm_name, compute p90, p95, p99
-     output_dict = {}
-     for llm_name, counts_list in llm_to_counts.items():
-         arr = np.array(counts_list)
-         p90_val = float(np.percentile(arr, 90))
-         p95_val = float(np.percentile(arr, 95))
-         p99_val = float(np.percentile(arr, 99))
-
-         output_dict[llm_name] = LLMUniquenessMetrics(p90=p90_val, p95=p95_val, p99=p99_val)
-
-     ret_val = LLMUniquenessMetricsByLLM(root=output_dict)
-     # Validate & return as a RootModel
-     return ret_val
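
Stripped of the pandas grouping, the metric above is a set difference over word tokens followed by NumPy percentiles. A dependency-light sketch with invented call texts (not aiq code):

    import re

    import numpy as np

    def new_words(prev: str, cur: str) -> int:
        """Count words in `cur` that do not appear in `prev` (case-insensitive)."""
        def tokenize(text: str) -> set:
            return set(re.findall(r"\w+", text.lower()))
        return len(tokenize(cur) - tokenize(prev))

    calls = [
        "Summarize the meeting notes",
        "Summarize the meeting notes and list action items",
        "Summarize the meeting notes and list action items by owner",
    ]
    counts = [new_words(a, b) for a, b in zip(calls, calls[1:])]  # [4, 2]
    print(float(np.percentile(np.array(counts), 95)))  # 3.9
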
aiq/profiler/inference_optimization/workflow_runtimes.py
@@ -1,72 +0,0 @@
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
- # SPDX-License-Identifier: Apache-2.0
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
-
- import numpy as np
-
- from aiq.data_models.intermediate_step import IntermediateStep
- from aiq.profiler.inference_optimization.data_models import WorkflowRuntimeMetrics
- from aiq.profiler.utils import create_standardized_dataframe
-
-
- def compute_workflow_runtime_metrics(all_steps: list[list[IntermediateStep]]) -> WorkflowRuntimeMetrics:
-     """
-     Computes the p90, p95, and p99 of workflow runtime for each example_number.
-
-     The 'workflow runtime' per example is::
-
-         max(event_timestamp) - min(event_timestamp)
-
-     for that example_number.
-
-     Parameters
-     ----------
-     all_steps : list[list[IntermediateStep]]
-         Intermediate steps, one list per example. The standardized DataFrame
-         built from them must contain at least two columns:
-         - 'example_number'
-         - 'event_timestamp'
-
-     Returns
-     -------
-     WorkflowRuntimeMetrics
-         A Pydantic model with 'p90', 'p95', and 'p99' attributes.
-     """
-     df = create_standardized_dataframe(all_steps)
-     required_cols = {"example_number", "event_timestamp"}
-     missing = required_cols - set(df.columns)
-     if missing:
-         raise ValueError(f"DataFrame is missing required columns: {missing}")
-
-     # Group by example_number, then find min and max timestamp
-     grouped = df.groupby("example_number")["event_timestamp"]
-     min_timestamps = grouped.min()
-     max_timestamps = grouped.max()
-
-     # Workflow runtime is difference between max and min
-     runtimes = max_timestamps - min_timestamps
-
-     # Convert to a NumPy array for percentile calculations
-     runtimes_arr = runtimes.values
-
-     # Edge case: if there's only one example or no data
-     # (NumPy percentile can handle 1-element arrays, but let's guard for empties)
-     if len(runtimes_arr) == 0:
-         return WorkflowRuntimeMetrics(p90=0.0, p95=0.0, p99=0.0)
-
-     # Compute p90, p95, p99
-     p90_val = float(np.percentile(runtimes_arr, 90))
-     p95_val = float(np.percentile(runtimes_arr, 95))
-     p99_val = float(np.percentile(runtimes_arr, 99))
-
-     return WorkflowRuntimeMetrics(p90=p90_val, p95=p95_val, p99=p99_val)
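
Because the per-example runtime reduces to a grouped max-minus-min, the computation is easy to verify by hand. A small sketch with made-up timestamps; only the column names mirror the standardized DataFrame:

    import numpy as np
    import pandas as pd

    df = pd.DataFrame({
        "example_number": [1, 1, 2, 2],
        "event_timestamp": [0.0, 2.5, 10.0, 11.0],
    })

    grouped = df.groupby("example_number")["event_timestamp"]
    runtimes = (grouped.max() - grouped.min()).values  # [2.5, 1.0]
    print(float(np.percentile(runtimes, 90)))  # 2.35
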
aiq/profiler/intermediate_property_adapter.py
@@ -1,102 +0,0 @@
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
- # SPDX-License-Identifier: Apache-2.0
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
-
- from aiq.data_models.intermediate_step import IntermediateStep
- from aiq.data_models.intermediate_step import IntermediateStepType
- from aiq.data_models.intermediate_step import TokenUsageBaseModel
-
-
- class IntermediatePropertyAdaptor(IntermediateStep):
-
-     @classmethod
-     def from_intermediate_step(cls, step: IntermediateStep) -> "IntermediatePropertyAdaptor":
-         """
-         Create an adaptor instance from an existing IntermediateStep.
-         Uses the dict() representation of the instance to initialize the adaptor.
-         """
-         return cls(**step.model_dump())
-
-     @property
-     def token_usage(self) -> TokenUsageBaseModel:
-         return self.payload.usage_info.token_usage if self.payload.usage_info else TokenUsageBaseModel()
-
-     @property
-     def seconds_between_calls(self) -> int:
-         return self.payload.usage_info.seconds_between_calls if self.payload.usage_info else 0
-
-     @property
-     def llm_text_input(self) -> str:
-         ret = ""
-         if self.payload.data and self.event_type == IntermediateStepType.LLM_START:
-             ret = self.payload.data.input
-         return ret
-
-     @property
-     def llm_text_output(self) -> str:
-         ret = ""
-         if self.payload.data and self.event_type == IntermediateStepType.LLM_END:
-             ret = self.payload.data.output
-         return ret
-
-     @property
-     def llm_text_chunk(self) -> str:
-         ret = ""
-         if self.payload.data and self.event_type == IntermediateStepType.LLM_NEW_TOKEN:
-             ret = self.payload.data.chunk
-         return ret
-
-     @property
-     def tool_input(self) -> str:
-         ret = ""
-         if self.payload.data and self.event_type == IntermediateStepType.TOOL_START:
-             ret = self.payload.data.input
-         return ret
-
-     @property
-     def tool_output(self) -> str:
-         ret = ""
-         if self.payload.data and self.event_type == IntermediateStepType.TOOL_END:
-             ret = self.payload.data.output
-         return ret
-
-     @property
-     def llm_name(self) -> str:
-         ret = ""
-         if self.payload.name and self.event_type in [IntermediateStepType.LLM_START, IntermediateStepType.LLM_END]:
-             ret = self.payload.name
-         return ret
-
-     @property
-     def tool_name(self) -> str:
-         ret = ""
-         if self.payload.name and self.event_type in [IntermediateStepType.TOOL_START, IntermediateStepType.TOOL_END]:
-             ret = self.payload.name
-         return ret
-
-     @property
-     def function_name(self) -> str:
-         return self.function_ancestry.function_name
-
-     @property
-     def function_id(self) -> str:
-         return self.function_ancestry.function_id
-
-     @property
-     def parent_function_id(self) -> str:
-         return self.function_ancestry.parent_id
-
-     @property
-     def parent_function_name(self) -> str:
-         return self.function_ancestry.parent_name
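
Using the adaptor is a single wrap-then-read. A hedged sketch against aiqtoolkit 1.1.0rc6 (the last release shipping aiq/profiler/intermediate_property_adapter.py); `step` is assumed to be an IntermediateStep captured from a profiled workflow run:

    from aiq.profiler.intermediate_property_adapter import IntermediatePropertyAdaptor

    adapted = IntermediatePropertyAdaptor.from_intermediate_step(step)

    # Each property checks the event type and falls back to "" (or a default
    # model), so reads are safe without filtering on event_type first.
    print(adapted.llm_name, adapted.llm_text_input, adapted.token_usage)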