PyPI - aiqtoolkit - Versions diffs - 1.2.0rc4__py3-none-any.whl → 1.2rc9__py3-none-any.whl - Mend

aiqtoolkit 1.2.0rc4__py3-none-any.whl → 1.2rc9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of aiqtoolkit might be problematic. Click here for more details.

Files changed (441)

aiqtoolkit-1.2rc9.dist-info/METADATA +29 -0
aiqtoolkit-1.2rc9.dist-info/RECORD +4 -0
aiqtoolkit-1.2rc9.dist-info/top_level.txt +1 -0
aiq/agent/__init__.py +0 -0
aiq/agent/base.py +0 -239
aiq/agent/dual_node.py +0 -67
aiq/agent/react_agent/__init__.py +0 -0
aiq/agent/react_agent/agent.py +0 -355
aiq/agent/react_agent/output_parser.py +0 -104
aiq/agent/react_agent/prompt.py +0 -41
aiq/agent/react_agent/register.py +0 -149
aiq/agent/reasoning_agent/__init__.py +0 -0
aiq/agent/reasoning_agent/reasoning_agent.py +0 -225
aiq/agent/register.py +0 -23
aiq/agent/rewoo_agent/__init__.py +0 -0
aiq/agent/rewoo_agent/agent.py +0 -411
aiq/agent/rewoo_agent/prompt.py +0 -108
aiq/agent/rewoo_agent/register.py +0 -158
aiq/agent/tool_calling_agent/__init__.py +0 -0
aiq/agent/tool_calling_agent/agent.py +0 -119
aiq/agent/tool_calling_agent/register.py +0 -106
aiq/authentication/__init__.py +0 -14
aiq/authentication/api_key/__init__.py +0 -14
aiq/authentication/api_key/api_key_auth_provider.py +0 -96
aiq/authentication/api_key/api_key_auth_provider_config.py +0 -124
aiq/authentication/api_key/register.py +0 -26
aiq/authentication/exceptions/__init__.py +0 -14
aiq/authentication/exceptions/api_key_exceptions.py +0 -38
aiq/authentication/exceptions/auth_code_grant_exceptions.py +0 -86
aiq/authentication/exceptions/call_back_exceptions.py +0 -38
aiq/authentication/exceptions/request_exceptions.py +0 -54
aiq/authentication/http_basic_auth/__init__.py +0 -0
aiq/authentication/http_basic_auth/http_basic_auth_provider.py +0 -81
aiq/authentication/http_basic_auth/register.py +0 -30
aiq/authentication/interfaces.py +0 -93
aiq/authentication/oauth2/__init__.py +0 -14
aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +0 -107
aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +0 -39
aiq/authentication/oauth2/register.py +0 -25
aiq/authentication/register.py +0 -21
aiq/builder/__init__.py +0 -0
aiq/builder/builder.py +0 -285
aiq/builder/component_utils.py +0 -316
aiq/builder/context.py +0 -264
aiq/builder/embedder.py +0 -24
aiq/builder/eval_builder.py +0 -161
aiq/builder/evaluator.py +0 -29
aiq/builder/framework_enum.py +0 -24
aiq/builder/front_end.py +0 -73
aiq/builder/function.py +0 -344
aiq/builder/function_base.py +0 -380
aiq/builder/function_info.py +0 -627
aiq/builder/intermediate_step_manager.py +0 -174
aiq/builder/llm.py +0 -25
aiq/builder/retriever.py +0 -25
aiq/builder/user_interaction_manager.py +0 -74
aiq/builder/workflow.py +0 -148
aiq/builder/workflow_builder.py +0 -1117
aiq/cli/__init__.py +0 -14
aiq/cli/cli_utils/__init__.py +0 -0
aiq/cli/cli_utils/config_override.py +0 -231
aiq/cli/cli_utils/validation.py +0 -37
aiq/cli/commands/__init__.py +0 -0
aiq/cli/commands/configure/__init__.py +0 -0
aiq/cli/commands/configure/channel/__init__.py +0 -0
aiq/cli/commands/configure/channel/add.py +0 -28
aiq/cli/commands/configure/channel/channel.py +0 -36
aiq/cli/commands/configure/channel/remove.py +0 -30
aiq/cli/commands/configure/channel/update.py +0 -30
aiq/cli/commands/configure/configure.py +0 -33
aiq/cli/commands/evaluate.py +0 -139
aiq/cli/commands/info/__init__.py +0 -14
aiq/cli/commands/info/info.py +0 -39
aiq/cli/commands/info/list_channels.py +0 -32
aiq/cli/commands/info/list_components.py +0 -129
aiq/cli/commands/info/list_mcp.py +0 -213
aiq/cli/commands/registry/__init__.py +0 -14
aiq/cli/commands/registry/publish.py +0 -88
aiq/cli/commands/registry/pull.py +0 -118
aiq/cli/commands/registry/registry.py +0 -38
aiq/cli/commands/registry/remove.py +0 -108
aiq/cli/commands/registry/search.py +0 -155
aiq/cli/commands/sizing/__init__.py +0 -14
aiq/cli/commands/sizing/calc.py +0 -297
aiq/cli/commands/sizing/sizing.py +0 -27
aiq/cli/commands/start.py +0 -246
aiq/cli/commands/uninstall.py +0 -81
aiq/cli/commands/validate.py +0 -47
aiq/cli/commands/workflow/__init__.py +0 -14
aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
aiq/cli/commands/workflow/templates/config.yml.j2 +0 -16
aiq/cli/commands/workflow/templates/pyproject.toml.j2 +0 -22
aiq/cli/commands/workflow/templates/register.py.j2 +0 -5
aiq/cli/commands/workflow/templates/workflow.py.j2 +0 -36
aiq/cli/commands/workflow/workflow.py +0 -37
aiq/cli/commands/workflow/workflow_commands.py +0 -313
aiq/cli/entrypoint.py +0 -135
aiq/cli/main.py +0 -44
aiq/cli/register_workflow.py +0 -488
aiq/cli/type_registry.py +0 -1000
aiq/data_models/__init__.py +0 -14
aiq/data_models/api_server.py +0 -694
aiq/data_models/authentication.py +0 -231
aiq/data_models/common.py +0 -171
aiq/data_models/component.py +0 -54
aiq/data_models/component_ref.py +0 -168
aiq/data_models/config.py +0 -406
aiq/data_models/dataset_handler.py +0 -123
aiq/data_models/discovery_metadata.py +0 -335
aiq/data_models/embedder.py +0 -27
aiq/data_models/evaluate.py +0 -127
aiq/data_models/evaluator.py +0 -26
aiq/data_models/front_end.py +0 -26
aiq/data_models/function.py +0 -30
aiq/data_models/function_dependencies.py +0 -72
aiq/data_models/interactive.py +0 -246
aiq/data_models/intermediate_step.py +0 -302
aiq/data_models/invocation_node.py +0 -38
aiq/data_models/its_strategy.py +0 -30
aiq/data_models/llm.py +0 -27
aiq/data_models/logging.py +0 -26
aiq/data_models/memory.py +0 -27
aiq/data_models/object_store.py +0 -44
aiq/data_models/profiler.py +0 -54
aiq/data_models/registry_handler.py +0 -26
aiq/data_models/retriever.py +0 -30
aiq/data_models/retry_mixin.py +0 -35
aiq/data_models/span.py +0 -187
aiq/data_models/step_adaptor.py +0 -64
aiq/data_models/streaming.py +0 -33
aiq/data_models/swe_bench_model.py +0 -54
aiq/data_models/telemetry_exporter.py +0 -26
aiq/embedder/__init__.py +0 -0
aiq/embedder/langchain_client.py +0 -41
aiq/embedder/nim_embedder.py +0 -59
aiq/embedder/openai_embedder.py +0 -43
aiq/embedder/register.py +0 -24
aiq/eval/__init__.py +0 -14
aiq/eval/config.py +0 -60
aiq/eval/dataset_handler/__init__.py +0 -0
aiq/eval/dataset_handler/dataset_downloader.py +0 -106
aiq/eval/dataset_handler/dataset_filter.py +0 -52
aiq/eval/dataset_handler/dataset_handler.py +0 -254
aiq/eval/evaluate.py +0 -506
aiq/eval/evaluator/__init__.py +0 -14
aiq/eval/evaluator/base_evaluator.py +0 -73
aiq/eval/evaluator/evaluator_model.py +0 -45
aiq/eval/intermediate_step_adapter.py +0 -99
aiq/eval/rag_evaluator/__init__.py +0 -0
aiq/eval/rag_evaluator/evaluate.py +0 -178
aiq/eval/rag_evaluator/register.py +0 -143
aiq/eval/register.py +0 -23
aiq/eval/remote_workflow.py +0 -133
aiq/eval/runners/__init__.py +0 -14
aiq/eval/runners/config.py +0 -39
aiq/eval/runners/multi_eval_runner.py +0 -54
aiq/eval/runtime_event_subscriber.py +0 -52
aiq/eval/swe_bench_evaluator/__init__.py +0 -0
aiq/eval/swe_bench_evaluator/evaluate.py +0 -215
aiq/eval/swe_bench_evaluator/register.py +0 -36
aiq/eval/trajectory_evaluator/__init__.py +0 -0
aiq/eval/trajectory_evaluator/evaluate.py +0 -75
aiq/eval/trajectory_evaluator/register.py +0 -40
aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
aiq/eval/tunable_rag_evaluator/evaluate.py +0 -245
aiq/eval/tunable_rag_evaluator/register.py +0 -52
aiq/eval/usage_stats.py +0 -41
aiq/eval/utils/__init__.py +0 -0
aiq/eval/utils/output_uploader.py +0 -140
aiq/eval/utils/tqdm_position_registry.py +0 -40
aiq/eval/utils/weave_eval.py +0 -184
aiq/experimental/__init__.py +0 -0
aiq/experimental/decorators/__init__.py +0 -0
aiq/experimental/decorators/experimental_warning_decorator.py +0 -130
aiq/experimental/inference_time_scaling/__init__.py +0 -0
aiq/experimental/inference_time_scaling/editing/__init__.py +0 -0
aiq/experimental/inference_time_scaling/editing/iterative_plan_refinement_editor.py +0 -147
aiq/experimental/inference_time_scaling/editing/llm_as_a_judge_editor.py +0 -204
aiq/experimental/inference_time_scaling/editing/motivation_aware_summarization.py +0 -107
aiq/experimental/inference_time_scaling/functions/__init__.py +0 -0
aiq/experimental/inference_time_scaling/functions/execute_score_select_function.py +0 -105
aiq/experimental/inference_time_scaling/functions/its_tool_orchestration_function.py +0 -205
aiq/experimental/inference_time_scaling/functions/its_tool_wrapper_function.py +0 -146
aiq/experimental/inference_time_scaling/functions/plan_select_execute_function.py +0 -224
aiq/experimental/inference_time_scaling/models/__init__.py +0 -0
aiq/experimental/inference_time_scaling/models/editor_config.py +0 -132
aiq/experimental/inference_time_scaling/models/its_item.py +0 -48
aiq/experimental/inference_time_scaling/models/scoring_config.py +0 -112
aiq/experimental/inference_time_scaling/models/search_config.py +0 -120
aiq/experimental/inference_time_scaling/models/selection_config.py +0 -154
aiq/experimental/inference_time_scaling/models/stage_enums.py +0 -43
aiq/experimental/inference_time_scaling/models/strategy_base.py +0 -66
aiq/experimental/inference_time_scaling/models/tool_use_config.py +0 -41
aiq/experimental/inference_time_scaling/register.py +0 -36
aiq/experimental/inference_time_scaling/scoring/__init__.py +0 -0
aiq/experimental/inference_time_scaling/scoring/llm_based_agent_scorer.py +0 -168
aiq/experimental/inference_time_scaling/scoring/llm_based_plan_scorer.py +0 -168
aiq/experimental/inference_time_scaling/scoring/motivation_aware_scorer.py +0 -111
aiq/experimental/inference_time_scaling/search/__init__.py +0 -0
aiq/experimental/inference_time_scaling/search/multi_llm_planner.py +0 -128
aiq/experimental/inference_time_scaling/search/multi_query_retrieval_search.py +0 -122
aiq/experimental/inference_time_scaling/search/single_shot_multi_plan_planner.py +0 -128
aiq/experimental/inference_time_scaling/selection/__init__.py +0 -0
aiq/experimental/inference_time_scaling/selection/best_of_n_selector.py +0 -63
aiq/experimental/inference_time_scaling/selection/llm_based_agent_output_selector.py +0 -131
aiq/experimental/inference_time_scaling/selection/llm_based_output_merging_selector.py +0 -159
aiq/experimental/inference_time_scaling/selection/llm_based_plan_selector.py +0 -128
aiq/experimental/inference_time_scaling/selection/threshold_selector.py +0 -58
aiq/front_ends/__init__.py +0 -14
aiq/front_ends/console/__init__.py +0 -14
aiq/front_ends/console/authentication_flow_handler.py +0 -233
aiq/front_ends/console/console_front_end_config.py +0 -32
aiq/front_ends/console/console_front_end_plugin.py +0 -96
aiq/front_ends/console/register.py +0 -25
aiq/front_ends/cron/__init__.py +0 -14
aiq/front_ends/fastapi/__init__.py +0 -14
aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +0 -27
aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +0 -107
aiq/front_ends/fastapi/fastapi_front_end_config.py +0 -234
aiq/front_ends/fastapi/fastapi_front_end_controller.py +0 -68
aiq/front_ends/fastapi/fastapi_front_end_plugin.py +0 -116
aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +0 -1092
aiq/front_ends/fastapi/html_snippets/__init__.py +0 -14
aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +0 -35
aiq/front_ends/fastapi/intermediate_steps_subscriber.py +0 -80
aiq/front_ends/fastapi/job_store.py +0 -183
aiq/front_ends/fastapi/main.py +0 -72
aiq/front_ends/fastapi/message_handler.py +0 -298
aiq/front_ends/fastapi/message_validator.py +0 -345
aiq/front_ends/fastapi/register.py +0 -25
aiq/front_ends/fastapi/response_helpers.py +0 -195
aiq/front_ends/fastapi/step_adaptor.py +0 -321
aiq/front_ends/mcp/__init__.py +0 -14
aiq/front_ends/mcp/mcp_front_end_config.py +0 -32
aiq/front_ends/mcp/mcp_front_end_plugin.py +0 -93
aiq/front_ends/mcp/register.py +0 -27
aiq/front_ends/mcp/tool_converter.py +0 -242
aiq/front_ends/register.py +0 -22
aiq/front_ends/simple_base/__init__.py +0 -14
aiq/front_ends/simple_base/simple_front_end_plugin_base.py +0 -54
aiq/llm/__init__.py +0 -0
aiq/llm/aws_bedrock_llm.py +0 -57
aiq/llm/nim_llm.py +0 -46
aiq/llm/openai_llm.py +0 -46
aiq/llm/register.py +0 -23
aiq/llm/utils/__init__.py +0 -14
aiq/llm/utils/env_config_value.py +0 -94
aiq/llm/utils/error.py +0 -17
aiq/memory/__init__.py +0 -20
aiq/memory/interfaces.py +0 -183
aiq/memory/models.py +0 -112
aiq/meta/module_to_distro.json +0 -3
aiq/meta/pypi.md +0 -58
aiq/object_store/__init__.py +0 -20
aiq/object_store/in_memory_object_store.py +0 -76
aiq/object_store/interfaces.py +0 -84
aiq/object_store/models.py +0 -36
aiq/object_store/register.py +0 -20
aiq/observability/__init__.py +0 -14
aiq/observability/exporter/__init__.py +0 -14
aiq/observability/exporter/base_exporter.py +0 -449
aiq/observability/exporter/exporter.py +0 -78
aiq/observability/exporter/file_exporter.py +0 -33
aiq/observability/exporter/processing_exporter.py +0 -322
aiq/observability/exporter/raw_exporter.py +0 -52
aiq/observability/exporter/span_exporter.py +0 -265
aiq/observability/exporter_manager.py +0 -335
aiq/observability/mixin/__init__.py +0 -14
aiq/observability/mixin/batch_config_mixin.py +0 -26
aiq/observability/mixin/collector_config_mixin.py +0 -23
aiq/observability/mixin/file_mixin.py +0 -288
aiq/observability/mixin/file_mode.py +0 -23
aiq/observability/mixin/resource_conflict_mixin.py +0 -134
aiq/observability/mixin/serialize_mixin.py +0 -61
aiq/observability/mixin/type_introspection_mixin.py +0 -183
aiq/observability/processor/__init__.py +0 -14
aiq/observability/processor/batching_processor.py +0 -309
aiq/observability/processor/callback_processor.py +0 -42
aiq/observability/processor/intermediate_step_serializer.py +0 -28
aiq/observability/processor/processor.py +0 -71
aiq/observability/register.py +0 -96
aiq/observability/utils/__init__.py +0 -14
aiq/observability/utils/dict_utils.py +0 -236
aiq/observability/utils/time_utils.py +0 -31
aiq/plugins/.namespace +0 -1
aiq/profiler/__init__.py +0 -0
aiq/profiler/calc/__init__.py +0 -14
aiq/profiler/calc/calc_runner.py +0 -627
aiq/profiler/calc/calculations.py +0 -288
aiq/profiler/calc/data_models.py +0 -188
aiq/profiler/calc/plot.py +0 -345
aiq/profiler/callbacks/__init__.py +0 -0
aiq/profiler/callbacks/agno_callback_handler.py +0 -295
aiq/profiler/callbacks/base_callback_class.py +0 -20
aiq/profiler/callbacks/langchain_callback_handler.py +0 -290
aiq/profiler/callbacks/llama_index_callback_handler.py +0 -205
aiq/profiler/callbacks/semantic_kernel_callback_handler.py +0 -238
aiq/profiler/callbacks/token_usage_base_model.py +0 -27
aiq/profiler/data_frame_row.py +0 -51
aiq/profiler/data_models.py +0 -24
aiq/profiler/decorators/__init__.py +0 -0
aiq/profiler/decorators/framework_wrapper.py +0 -131
aiq/profiler/decorators/function_tracking.py +0 -254
aiq/profiler/forecasting/__init__.py +0 -0
aiq/profiler/forecasting/config.py +0 -18
aiq/profiler/forecasting/model_trainer.py +0 -75
aiq/profiler/forecasting/models/__init__.py +0 -22
aiq/profiler/forecasting/models/forecasting_base_model.py +0 -40
aiq/profiler/forecasting/models/linear_model.py +0 -196
aiq/profiler/forecasting/models/random_forest_regressor.py +0 -268
aiq/profiler/inference_metrics_model.py +0 -28
aiq/profiler/inference_optimization/__init__.py +0 -0
aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +0 -460
aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +0 -258
aiq/profiler/inference_optimization/data_models.py +0 -386
aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +0 -468
aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +0 -405
aiq/profiler/inference_optimization/llm_metrics.py +0 -212
aiq/profiler/inference_optimization/prompt_caching.py +0 -163
aiq/profiler/inference_optimization/token_uniqueness.py +0 -107
aiq/profiler/inference_optimization/workflow_runtimes.py +0 -72
aiq/profiler/intermediate_property_adapter.py +0 -102
aiq/profiler/profile_runner.py +0 -473
aiq/profiler/utils.py +0 -184
aiq/registry_handlers/__init__.py +0 -0
aiq/registry_handlers/local/__init__.py +0 -0
aiq/registry_handlers/local/local_handler.py +0 -176
aiq/registry_handlers/local/register_local.py +0 -37
aiq/registry_handlers/metadata_factory.py +0 -60
aiq/registry_handlers/package_utils.py +0 -567
aiq/registry_handlers/pypi/__init__.py +0 -0
aiq/registry_handlers/pypi/pypi_handler.py +0 -251
aiq/registry_handlers/pypi/register_pypi.py +0 -40
aiq/registry_handlers/register.py +0 -21
aiq/registry_handlers/registry_handler_base.py +0 -157
aiq/registry_handlers/rest/__init__.py +0 -0
aiq/registry_handlers/rest/register_rest.py +0 -56
aiq/registry_handlers/rest/rest_handler.py +0 -237
aiq/registry_handlers/schemas/__init__.py +0 -0
aiq/registry_handlers/schemas/headers.py +0 -42
aiq/registry_handlers/schemas/package.py +0 -68
aiq/registry_handlers/schemas/publish.py +0 -63
aiq/registry_handlers/schemas/pull.py +0 -82
aiq/registry_handlers/schemas/remove.py +0 -36
aiq/registry_handlers/schemas/search.py +0 -91
aiq/registry_handlers/schemas/status.py +0 -47
aiq/retriever/__init__.py +0 -0
aiq/retriever/interface.py +0 -37
aiq/retriever/milvus/__init__.py +0 -14
aiq/retriever/milvus/register.py +0 -81
aiq/retriever/milvus/retriever.py +0 -228
aiq/retriever/models.py +0 -74
aiq/retriever/nemo_retriever/__init__.py +0 -14
aiq/retriever/nemo_retriever/register.py +0 -60
aiq/retriever/nemo_retriever/retriever.py +0 -190
aiq/retriever/register.py +0 -22
aiq/runtime/__init__.py +0 -14
aiq/runtime/loader.py +0 -215
aiq/runtime/runner.py +0 -190
aiq/runtime/session.py +0 -158
aiq/runtime/user_metadata.py +0 -130
aiq/settings/__init__.py +0 -0
aiq/settings/global_settings.py +0 -318
aiq/test/.namespace +0 -1
aiq/tool/__init__.py +0 -0
aiq/tool/chat_completion.py +0 -74
aiq/tool/code_execution/README.md +0 -151
aiq/tool/code_execution/__init__.py +0 -0
aiq/tool/code_execution/code_sandbox.py +0 -267
aiq/tool/code_execution/local_sandbox/.gitignore +0 -1
aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +0 -60
aiq/tool/code_execution/local_sandbox/__init__.py +0 -13
aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +0 -198
aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +0 -6
aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +0 -50
aiq/tool/code_execution/register.py +0 -74
aiq/tool/code_execution/test_code_execution_sandbox.py +0 -414
aiq/tool/code_execution/utils.py +0 -100
aiq/tool/datetime_tools.py +0 -42
aiq/tool/document_search.py +0 -141
aiq/tool/github_tools/__init__.py +0 -0
aiq/tool/github_tools/create_github_commit.py +0 -133
aiq/tool/github_tools/create_github_issue.py +0 -87
aiq/tool/github_tools/create_github_pr.py +0 -106
aiq/tool/github_tools/get_github_file.py +0 -106
aiq/tool/github_tools/get_github_issue.py +0 -166
aiq/tool/github_tools/get_github_pr.py +0 -256
aiq/tool/github_tools/update_github_issue.py +0 -100
aiq/tool/mcp/__init__.py +0 -14
aiq/tool/mcp/exceptions.py +0 -142
aiq/tool/mcp/mcp_client.py +0 -255
aiq/tool/mcp/mcp_tool.py +0 -96
aiq/tool/memory_tools/__init__.py +0 -0
aiq/tool/memory_tools/add_memory_tool.py +0 -79
aiq/tool/memory_tools/delete_memory_tool.py +0 -67
aiq/tool/memory_tools/get_memory_tool.py +0 -72
aiq/tool/nvidia_rag.py +0 -95
aiq/tool/register.py +0 -38
aiq/tool/retriever.py +0 -89
aiq/tool/server_tools.py +0 -66
aiq/utils/__init__.py +0 -0
aiq/utils/data_models/__init__.py +0 -0
aiq/utils/data_models/schema_validator.py +0 -58
aiq/utils/debugging_utils.py +0 -43
aiq/utils/dump_distro_mapping.py +0 -32
aiq/utils/exception_handlers/__init__.py +0 -0
aiq/utils/exception_handlers/automatic_retries.py +0 -289
aiq/utils/exception_handlers/mcp.py +0 -211
aiq/utils/exception_handlers/schemas.py +0 -114
aiq/utils/io/__init__.py +0 -0
aiq/utils/io/model_processing.py +0 -28
aiq/utils/io/yaml_tools.py +0 -119
aiq/utils/log_utils.py +0 -37
aiq/utils/metadata_utils.py +0 -74
aiq/utils/optional_imports.py +0 -142
aiq/utils/producer_consumer_queue.py +0 -178
aiq/utils/reactive/__init__.py +0 -0
aiq/utils/reactive/base/__init__.py +0 -0
aiq/utils/reactive/base/observable_base.py +0 -65
aiq/utils/reactive/base/observer_base.py +0 -55
aiq/utils/reactive/base/subject_base.py +0 -79
aiq/utils/reactive/observable.py +0 -59
aiq/utils/reactive/observer.py +0 -76
aiq/utils/reactive/subject.py +0 -131
aiq/utils/reactive/subscription.py +0 -49
aiq/utils/settings/__init__.py +0 -0
aiq/utils/settings/global_settings.py +0 -197
aiq/utils/string_utils.py +0 -38
aiq/utils/type_converter.py +0 -290
aiq/utils/type_utils.py +0 -484
aiq/utils/url_utils.py +0 -27
aiqtoolkit-1.2.0rc4.dist-info/METADATA +0 -363
aiqtoolkit-1.2.0rc4.dist-info/RECORD +0 -438
aiqtoolkit-1.2.0rc4.dist-info/entry_points.txt +0 -20
aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE-3rd-party.txt +0 -3686
aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE.md +0 -201
aiqtoolkit-1.2.0rc4.dist-info/top_level.txt +0 -1
{aiqtoolkit-1.2.0rc4.dist-info → aiqtoolkit-1.2rc9.dist-info}/WHEEL +0 -0

aiq/eval/tunable_rag_evaluator/evaluate.py DELETED Viewed

@@ -1,245 +0,0 @@
-# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
-# SPDX-License-Identifier: Apache-2.0
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import asyncio
-import logging
-from typing import Callable
-from langchain.output_parsers import ResponseSchema
-from langchain.output_parsers import StructuredOutputParser
-from langchain.schema import HumanMessage
-from langchain.schema import SystemMessage
-from langchain_core.language_models import BaseChatModel
-from langchain_core.runnables import RunnableLambda
-from tqdm import tqdm
-from aiq.eval.evaluator.base_evaluator import BaseEvaluator
-from aiq.eval.evaluator.evaluator_model import EvalInputItem
-from aiq.eval.evaluator.evaluator_model import EvalOutputItem
-logger = logging.getLogger(__name__)
-# pylint: disable=line-too-long
-# flake8: noqa: E501
-def evaluation_prompt(judge_llm_prompt: str,
-                      question: str,
-                      answer_description: str,
-                      generated_answer: str,
-                      format_instructions: str,
-                      default_scoring: bool):
-    """
-    This function generates a prompt for the judge LLM to evaluate the generated answer.
-    """
-    DEFAULT_SCORING_INSTRUCTIONS = """
-    The coverage score is a measure of how well the generated answer covers the critical aspects mentioned in the expected answer. A low coverage score indicates that the generated answer misses critical aspects of the expected answer. A middle coverage score indicates that the generated answer covers some of the must-haves of the expected answer but lacks other details. A high coverage score indicates that all of the expected aspects are present in the generated answer.
-    The correctness score is a measure of how well the generated answer matches the expected answer. A low correctness score indicates that the generated answer is incorrect or does not match the expected answer. A middle correctness score indicates that the generated answer is correct but lacks some details. A high correctness score indicates that the generated answer is exactly the same as the expected answer.
-    The relevance score is a measure of how well the generated answer is relevant to the question. A low relevance score indicates that the generated answer is not relevant to the question. A middle relevance score indicates that the generated answer is somewhat relevant to the question. A high relevance score indicates that the generated answer is exactly relevant to the question.
-    The reasoning is a 1-2 sentence explanation for the scoring.
-    """
-    DEFAULT_EVAL_PROMPT = (f"You are an intelligent assistant that responds strictly in JSON format."
-                           f"Judge based on the following scoring rubric: {DEFAULT_SCORING_INSTRUCTIONS}"
-                           f"{judge_llm_prompt}\n"
-                           f"{format_instructions}\n"
-                           f"Here is the user's query: {question}"
-                           f"Here is the description of the expected answer: {answer_description}"
-                           f"Here is the generated answer: {generated_answer}")
-    EVAL_PROMPT = (f"You are an intelligent assistant that responds strictly in JSON format. {judge_llm_prompt}\n"
-                   f"{format_instructions}\n"
-                   f"Here is the user's query: {question}"
-                   f"Here is the description of the expected answer: {answer_description}"
-                   f"Here is the generated answer: {generated_answer}")
-    return EVAL_PROMPT if not default_scoring else DEFAULT_EVAL_PROMPT
-def runnable_with_retries(original_fn: Callable, llm_retry_control_params: dict | None = None):
-    runnable = RunnableLambda(original_fn)
-    if llm_retry_control_params is None:
-        llm_retry_control_params = {
-            "stop_after_attempt": 3, "initial_backoff_delay_seconds": 1, "has_exponential_jitter": True
-        }
-    if llm_retry_control_params["has_exponential_jitter"] is None:
-        llm_retry_control_params["has_exponential_jitter"] = True
-    if llm_retry_control_params["stop_after_attempt"] is None:
-        llm_retry_control_params["stop_after_attempt"] = 3
-    if llm_retry_control_params["initial_backoff_delay_seconds"] is None:
-        llm_retry_control_params["initial_backoff_delay_seconds"] = 1
-    # Add retry logic with exponential backoff and jitter
-    return runnable.with_retry(
-        retry_if_exception_type=(Exception, ),  # Retry on any error
-        wait_exponential_jitter=llm_retry_control_params["has_exponential_jitter"],  # Add jitter to exponential backoff
-        stop_after_attempt=llm_retry_control_params["stop_after_attempt"],
-        exponential_jitter_params={"initial": llm_retry_control_params["initial_backoff_delay_seconds"]
-                                   }  # Optional: set initial backoff (seconds)
-    )
-class TunableRagEvaluator(BaseEvaluator):
-    '''Tunable RAG evaluator class with customizable LLM prompt for scoring.'''
-    def __init__(self,
-                 llm: BaseChatModel,
-                 judge_llm_prompt: str,
-                 llm_retry_control_params: dict | None,
-                 max_concurrency: int,
-                 default_scoring: bool,
-                 default_score_weights: dict):
-        super().__init__(max_concurrency=max_concurrency, tqdm_desc="Evaluating RAG")
-        self.llm = llm
-        self.judge_llm_prompt = judge_llm_prompt
-        self.llm_retry_control_params = llm_retry_control_params
-        self.default_scoring = default_scoring
-        # Use user-provided weights if available; otherwise, set equal weights for each score
-        self.default_score_weights = default_score_weights if default_score_weights else {
-            "coverage": 1 / 3, "correctness": 1 / 3, "relevance": 1 / 3
-        }
-    async def evaluate_item(self, item: EvalInputItem) -> EvalOutputItem:
-        """Compute RAG evaluation for an individual item and return EvalOutputItem"""
-        question = item.input_obj
-        answer_description = item.expected_output_obj
-        generated_answer = item.output_obj
-        # Call judge LLM to generate score
-        score = 0.0
-        default_evaluation_schema = [
-            ResponseSchema(
-                name="coverage_score",
-                description="Score for the coverage of all critical aspects mentioned in the expected answer. Ex. 0.5",
-                type="float"),
-            ResponseSchema(
-                name="correctness_score",
-                description="Score for the accuracy of the generated answer compared to the expected answer. Ex. 0.5",
-                type="float"),
-            ResponseSchema(name="relevance_score",
-                           description="Score for the relevance of the generated answer to the question. Ex. 0.5",
-                           type="float"),
-            ResponseSchema(
-                name="reasoning",
-                description=
-                "1-2 summarized sentences of reasoning for the scores. Ex. 'The generated answer covers all critical aspects mentioned in the expected answer, is correct, and is relevant to the question.'",
-                type="string"),
-        ]
-        custom_evaluation_schema = [
-            ResponseSchema(name="score", description="Score for the generated answer. Ex. 0.5", type="float"),
-            ResponseSchema(
-                name="reasoning",
-                description=
-                "1-2 sentence reasoning for the score. Ex. 'The generated answer is exactly the same as the description of the expected answer.'",
-                type="string"),
-        ]
-        if self.default_scoring:
-            evaluation_schema = default_evaluation_schema
-        else:
-            evaluation_schema = custom_evaluation_schema
-        llm_input_response_parser = StructuredOutputParser.from_response_schemas(evaluation_schema)
-        format_instructions = llm_input_response_parser.get_format_instructions()
-        eval_prompt = evaluation_prompt(judge_llm_prompt=self.judge_llm_prompt,
-                                        question=question,
-                                        answer_description=answer_description,
-                                        generated_answer=generated_answer,
-                                        format_instructions=format_instructions,
-                                        default_scoring=self.default_scoring)
-        messages = [SystemMessage(content="You must respond only in JSON format."), HumanMessage(content=eval_prompt)]
-        response = await runnable_with_retries(self.llm.ainvoke, self.llm_retry_control_params).ainvoke(messages)
-        # Initialize default values to handle service errors
-        coverage_score = 0.0
-        correctness_score = 0.0
-        relevance_score = 0.0
-        reasoning = "Error in evaluator from parsing judge LLM response."
-        try:
-            parsed_response = llm_input_response_parser.parse(response.content)
-            if self.default_scoring:
-                try:
-                    coverage_score = parsed_response["coverage_score"]
-                    correctness_score = parsed_response["correctness_score"]
-                    relevance_score = parsed_response["relevance_score"]
-                    reasoning = parsed_response["reasoning"]
-                except KeyError as e:
-                    logger.error("Missing required keys in default scoring response: %s",
-                                 ", ".join(str(arg) for arg in e.args))
-                    reasoning = f"Error in evaluator from parsing judge LLM response. Missing required key(s): {', '.join(str(arg) for arg in e.args)}"
-                coverage_weight = self.default_score_weights.get("coverage", 1 / 3)
-                correctness_weight = self.default_score_weights.get("correctness", 1 / 3)
-                relevance_weight = self.default_score_weights.get("relevance", 1 / 3)
-                # Calculate score
-                total_weight = coverage_weight + correctness_weight + relevance_weight
-                coverage_weight = coverage_weight / total_weight
-                correctness_weight = correctness_weight / total_weight
-                relevance_weight = relevance_weight / total_weight
-                if round(coverage_weight + correctness_weight + relevance_weight, 2) != 1:
-                    logger.warning("The sum of the default score weights is not 1. The weights will be normalized.")
-                    coverage_weight = coverage_weight / (coverage_weight + correctness_weight + relevance_weight)
-                    correctness_weight = correctness_weight / (coverage_weight + correctness_weight + relevance_weight)
-                    relevance_weight = relevance_weight / (coverage_weight + correctness_weight + relevance_weight)
-                score = (coverage_weight * coverage_score + correctness_weight * correctness_score +
-                         relevance_weight * relevance_score)
-            else:
-                try:
-                    score = parsed_response["score"]
-                    reasoning = parsed_response["reasoning"]
-                except KeyError as e:
-                    logger.error("Missing required keys in custom scoring response: %s",
-                                 ", ".join(str(arg) for arg in e.args))
-                    reasoning = f"Error in evaluator from parsing judge LLM response. Missing required key(s): {', '.join(str(arg) for arg in e.args)}"
-                    raise
-        except (KeyError, ValueError) as e:
-            logger.error("Error parsing judge LLM response: %s", e)
-            score = 0.0
-            reasoning = "Error in evaluator from parsing judge LLM response."
-        if self.default_scoring:
-            reasoning = {
-                "question": question,
-                "answer_description": answer_description,
-                "generated_answer": generated_answer,
-                "score_breakdown": {
-                    "coverage_score": coverage_score,
-                    "correctness_score": correctness_score,
-                    "relevance_score": relevance_score,
-                },
-                "reasoning": reasoning,
-            }
-        else:
-            reasoning = {
-                "question": question,
-                "answer_description": answer_description,
-                "generated_answer": generated_answer,
-                "reasoning": reasoning
-            }
-        return EvalOutputItem(id=item.id, score=score, reasoning=reasoning)

aiq/eval/tunable_rag_evaluator/register.py DELETED Viewed

@@ -1,52 +0,0 @@
-# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
-# SPDX-License-Identifier: Apache-2.0
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-from pydantic import Field
-from aiq.builder.builder import EvalBuilder
-from aiq.builder.evaluator import EvaluatorInfo
-from aiq.builder.framework_enum import LLMFrameworkEnum
-from aiq.cli.register_workflow import register_evaluator
-from aiq.data_models.component_ref import LLMRef
-from aiq.data_models.evaluator import EvaluatorBaseConfig
-class TunableRagEvaluatorConfig(EvaluatorBaseConfig, name="tunable_rag_evaluator"):
-    '''Configuration for tunable RAG evaluator'''
-    llm_name: LLMRef = Field(description="Name of the judge LLM")
-    llm_retry_control_params: dict | None = Field(description="Parameters to control LLM retry behavior", default=None)
-    judge_llm_prompt: str = Field(description="LLM prompt for the judge LLM")
-    default_scoring: bool = Field(description="Whether to use default scoring", default=False)
-    default_score_weights: dict = Field(
-        default={
-            "coverage": 0.5, "correctness": 0.3, "relevance": 0.2
-        },
-        description="Weights for the different scoring components when using default scoring")
-@register_evaluator(config_type=TunableRagEvaluatorConfig)
-async def register_tunable_rag_evaluator(config: TunableRagEvaluatorConfig, builder: EvalBuilder):
-    '''Register tunable RAG evaluator'''
-    from .evaluate import TunableRagEvaluator
-    llm = await builder.get_llm(config.llm_name, wrapper_type=LLMFrameworkEnum.LANGCHAIN)
-    evaluator = TunableRagEvaluator(llm,
-                                    config.judge_llm_prompt,
-                                    config.llm_retry_control_params,
-                                    builder.get_max_concurrency(),
-                                    config.default_scoring,
-                                    config.default_score_weights)
-    yield EvaluatorInfo(config=config, evaluate_fn=evaluator.evaluate, description="Tunable RAG Evaluator")

aiq/eval/usage_stats.py DELETED Viewed

@@ -1,41 +0,0 @@
-# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
-# SPDX-License-Identifier: Apache-2.0
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import typing
-from pydantic import BaseModel
-class UsageStatsLLM(BaseModel):
-    prompt_tokens: int = 0
-    completion_tokens: int = 0
-    total_tokens: int = 0
-class UsageStatsItem(BaseModel):
-    usage_stats_per_llm: dict[str, UsageStatsLLM]
-    total_tokens: int | None = None
-    runtime: float = 0.0
-    min_timestamp: float = 0.0
-    max_timestamp: float = 0.0
-    llm_latency: float = 0.0
-class UsageStats(BaseModel):
-    # key is the id or input_obj from EvalInputItem
-    min_timestamp: float = 0.0
-    max_timestamp: float = 0.0
-    total_runtime: float = 0.0
-    usage_stats_items: dict[typing.Any, UsageStatsItem] = {}

aiq/eval/utils/__init__.py DELETED Viewed

File without changes

aiq/eval/utils/output_uploader.py DELETED Viewed

@@ -1,140 +0,0 @@
-# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
-# SPDX-License-Identifier: Apache-2.0
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-import asyncio
-import logging
-import os
-import subprocess
-import sys
-from pathlib import Path
-import aioboto3
-from botocore.exceptions import NoCredentialsError
-from tqdm import tqdm
-from aiq.data_models.evaluate import EvalOutputConfig
-logger = logging.getLogger(__name__)
-class OutputUploader:
-    """
-    Run custom scripts and upload evaluation outputs using the configured s3
-    credentials.
-    """
-    def __init__(self, output_config: EvalOutputConfig, job_id: str | None = None):
-        self.output_config = output_config
-        self._s3_client = None
-        self.job_id = job_id
-    @property
-    def s3_config(self):
-        return self.output_config.s3
-    async def _upload_file(self, s3_client, bucket, s3_key, local_path, pbar):
-        try:
-            await s3_client.upload_file(str(local_path), bucket, s3_key)
-            logger.info("Uploaded %s to s3://%s/%s", local_path, bucket, s3_key)
-            pbar.update(1)
-        except Exception as e:
-            logger.error("Failed to upload %s to s3://%s/%s: %s", local_path, bucket, s3_key, e)
-            raise
-    async def upload_directory(self):
-        """
-        Upload the contents of the local output directory to the remote S3 bucket in parallel.
-        """
-        if not self.output_config.s3:
-            logger.info("No S3 config provided; skipping upload.")
-            return
-        local_dir = self.output_config.dir
-        bucket = self.s3_config.bucket
-        remote_prefix = self.output_config.remote_dir or ""
-        if self.job_id:
-            remote_prefix = str(Path(remote_prefix) / f"jobs/{self.job_id}")
-        file_entries = []
-        for root, _, files in os.walk(local_dir):
-            for file in files:
-                local_path = Path(root) / file
-                relative_path = local_path.relative_to(local_dir)
-                s3_path = Path(remote_prefix) / relative_path
-                s3_key = str(s3_path).replace("\\", "/")  # Normalize for S3
-                file_entries.append((local_path, s3_key))
-        session = aioboto3.Session()
-        try:
-            if self.s3_config.endpoint_url:
-                region_name = None
-                endpoint_url = self.s3_config.endpoint_url
-            elif self.s3_config.region_name:
-                region_name = self.s3_config.region_name
-                endpoint_url = None
-            else:
-                raise ValueError("No endpoint_url or region_name provided in the config: eval.general.output.s3")
-            async with session.client(
-                    "s3",
-                    endpoint_url=endpoint_url,
-                    region_name=region_name,
-                    aws_access_key_id=self.s3_config.access_key,
-                    aws_secret_access_key=self.s3_config.secret_key,
-            ) as s3_client:
-                with tqdm(total=len(file_entries), desc="Uploading files to S3") as pbar:
-                    upload_tasks = [
-                        self._upload_file(s3_client, bucket, s3_key, local_path, pbar)
-                        for local_path, s3_key in file_entries
-                    ]
-                    await asyncio.gather(*upload_tasks)
-        except NoCredentialsError as e:
-            logger.error("AWS credentials not available: %s", e)
-            raise
-        except Exception as e:
-            logger.error("Failed to upload files to S3: %s", e)
-            raise
-    def run_custom_scripts(self):
-        """
-        Run custom Python scripts defined in the EvalOutputConfig.
-        Each script is run with its kwargs passed as command-line arguments.
-        The output directory is passed as the first argument.
-        """
-        for _, script_config in self.output_config.custom_scripts.items():
-            script_path = script_config.script
-            if not script_path.exists():
-                logger.error("Custom script %s does not exist.", script_path)
-                continue
-            # use python interpreter
-            args = [sys.executable, str(script_path)]
-            # add output directory as first keyword argument
-            args.append("--output_dir")
-            args.append(str(self.output_config.dir))
-            if script_config.kwargs:
-                for key, value in script_config.kwargs.items():
-                    args.append(f"--{key}")
-                    args.append(str(value))
-            display_args = " ".join(f'"{arg}"' if " " in arg else arg for arg in args[1:])
-            try:
-                logger.info("Running custom script: %s %s", script_path, display_args)
-                subprocess.run(args, check=True, text=True)
-                logger.info("Custom script %s completed successfully.", script_path)
-            except subprocess.CalledProcessError as e:
-                logger.error("Custom script %s failed with return code %s", script_path, e.returncode)
-                raise

aiq/eval/utils/tqdm_position_registry.py DELETED Viewed

@@ -1,40 +0,0 @@
-# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
-# SPDX-License-Identifier: Apache-2.0
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-class TqdmPositionRegistry:
-    """
-    A simple registry for tqdm positions.
-    """
-    _positions = set()
-    _max_positions = 100
-    @classmethod
-    def claim(cls) -> int:
-        """
-        Claim a tqdm position in the range of 0-99.
-        """
-        for i in range(cls._max_positions):
-            if i not in cls._positions:
-                cls._positions.add(i)
-                return i
-        raise RuntimeError("No available tqdm positions.")
-    @classmethod
-    def release(cls, pos: int):
-        """
-        Release a tqdm position.
-        """
-        cls._positions.discard(pos)

aiqtoolkit 1.2.0rc4__py3-none-any.whl → 1.2rc9__py3-none-any.whl

Potentially problematic release.

aiqtoolkit 1.2.0rc4py3-none-any.whl → 1.2rc9py3-none-any.whl