aiqtoolkit 1.2.0rc3__py3-none-any.whl → 1.2.0rc5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of aiqtoolkit might be problematic. Click here for more details.

Files changed (440) hide show
  1. aiqtoolkit-1.2.0rc5.dist-info/METADATA +29 -0
  2. aiqtoolkit-1.2.0rc5.dist-info/RECORD +4 -0
  3. aiqtoolkit-1.2.0rc5.dist-info/top_level.txt +1 -0
  4. aiq/agent/__init__.py +0 -0
  5. aiq/agent/base.py +0 -239
  6. aiq/agent/dual_node.py +0 -67
  7. aiq/agent/react_agent/__init__.py +0 -0
  8. aiq/agent/react_agent/agent.py +0 -355
  9. aiq/agent/react_agent/output_parser.py +0 -104
  10. aiq/agent/react_agent/prompt.py +0 -41
  11. aiq/agent/react_agent/register.py +0 -149
  12. aiq/agent/reasoning_agent/__init__.py +0 -0
  13. aiq/agent/reasoning_agent/reasoning_agent.py +0 -225
  14. aiq/agent/register.py +0 -23
  15. aiq/agent/rewoo_agent/__init__.py +0 -0
  16. aiq/agent/rewoo_agent/agent.py +0 -411
  17. aiq/agent/rewoo_agent/prompt.py +0 -108
  18. aiq/agent/rewoo_agent/register.py +0 -158
  19. aiq/agent/tool_calling_agent/__init__.py +0 -0
  20. aiq/agent/tool_calling_agent/agent.py +0 -119
  21. aiq/agent/tool_calling_agent/register.py +0 -106
  22. aiq/authentication/__init__.py +0 -14
  23. aiq/authentication/api_key/__init__.py +0 -14
  24. aiq/authentication/api_key/api_key_auth_provider.py +0 -92
  25. aiq/authentication/api_key/api_key_auth_provider_config.py +0 -124
  26. aiq/authentication/api_key/register.py +0 -26
  27. aiq/authentication/exceptions/__init__.py +0 -14
  28. aiq/authentication/exceptions/api_key_exceptions.py +0 -38
  29. aiq/authentication/exceptions/auth_code_grant_exceptions.py +0 -86
  30. aiq/authentication/exceptions/call_back_exceptions.py +0 -38
  31. aiq/authentication/exceptions/request_exceptions.py +0 -54
  32. aiq/authentication/http_basic_auth/__init__.py +0 -0
  33. aiq/authentication/http_basic_auth/http_basic_auth_provider.py +0 -81
  34. aiq/authentication/http_basic_auth/register.py +0 -30
  35. aiq/authentication/interfaces.py +0 -93
  36. aiq/authentication/oauth2/__init__.py +0 -14
  37. aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +0 -107
  38. aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +0 -39
  39. aiq/authentication/oauth2/register.py +0 -25
  40. aiq/authentication/register.py +0 -21
  41. aiq/builder/__init__.py +0 -0
  42. aiq/builder/builder.py +0 -285
  43. aiq/builder/component_utils.py +0 -316
  44. aiq/builder/context.py +0 -264
  45. aiq/builder/embedder.py +0 -24
  46. aiq/builder/eval_builder.py +0 -161
  47. aiq/builder/evaluator.py +0 -29
  48. aiq/builder/framework_enum.py +0 -24
  49. aiq/builder/front_end.py +0 -73
  50. aiq/builder/function.py +0 -344
  51. aiq/builder/function_base.py +0 -380
  52. aiq/builder/function_info.py +0 -627
  53. aiq/builder/intermediate_step_manager.py +0 -174
  54. aiq/builder/llm.py +0 -25
  55. aiq/builder/retriever.py +0 -25
  56. aiq/builder/user_interaction_manager.py +0 -74
  57. aiq/builder/workflow.py +0 -148
  58. aiq/builder/workflow_builder.py +0 -1117
  59. aiq/cli/__init__.py +0 -14
  60. aiq/cli/cli_utils/__init__.py +0 -0
  61. aiq/cli/cli_utils/config_override.py +0 -231
  62. aiq/cli/cli_utils/validation.py +0 -37
  63. aiq/cli/commands/__init__.py +0 -0
  64. aiq/cli/commands/configure/__init__.py +0 -0
  65. aiq/cli/commands/configure/channel/__init__.py +0 -0
  66. aiq/cli/commands/configure/channel/add.py +0 -28
  67. aiq/cli/commands/configure/channel/channel.py +0 -36
  68. aiq/cli/commands/configure/channel/remove.py +0 -30
  69. aiq/cli/commands/configure/channel/update.py +0 -30
  70. aiq/cli/commands/configure/configure.py +0 -33
  71. aiq/cli/commands/evaluate.py +0 -139
  72. aiq/cli/commands/info/__init__.py +0 -14
  73. aiq/cli/commands/info/info.py +0 -39
  74. aiq/cli/commands/info/list_channels.py +0 -32
  75. aiq/cli/commands/info/list_components.py +0 -129
  76. aiq/cli/commands/info/list_mcp.py +0 -213
  77. aiq/cli/commands/registry/__init__.py +0 -14
  78. aiq/cli/commands/registry/publish.py +0 -88
  79. aiq/cli/commands/registry/pull.py +0 -118
  80. aiq/cli/commands/registry/registry.py +0 -38
  81. aiq/cli/commands/registry/remove.py +0 -108
  82. aiq/cli/commands/registry/search.py +0 -155
  83. aiq/cli/commands/sizing/__init__.py +0 -14
  84. aiq/cli/commands/sizing/calc.py +0 -297
  85. aiq/cli/commands/sizing/sizing.py +0 -27
  86. aiq/cli/commands/start.py +0 -246
  87. aiq/cli/commands/uninstall.py +0 -81
  88. aiq/cli/commands/validate.py +0 -47
  89. aiq/cli/commands/workflow/__init__.py +0 -14
  90. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  91. aiq/cli/commands/workflow/templates/config.yml.j2 +0 -16
  92. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +0 -22
  93. aiq/cli/commands/workflow/templates/register.py.j2 +0 -5
  94. aiq/cli/commands/workflow/templates/workflow.py.j2 +0 -36
  95. aiq/cli/commands/workflow/workflow.py +0 -37
  96. aiq/cli/commands/workflow/workflow_commands.py +0 -313
  97. aiq/cli/entrypoint.py +0 -135
  98. aiq/cli/main.py +0 -44
  99. aiq/cli/register_workflow.py +0 -488
  100. aiq/cli/type_registry.py +0 -1000
  101. aiq/data_models/__init__.py +0 -14
  102. aiq/data_models/api_server.py +0 -694
  103. aiq/data_models/authentication.py +0 -231
  104. aiq/data_models/common.py +0 -171
  105. aiq/data_models/component.py +0 -54
  106. aiq/data_models/component_ref.py +0 -168
  107. aiq/data_models/config.py +0 -406
  108. aiq/data_models/dataset_handler.py +0 -123
  109. aiq/data_models/discovery_metadata.py +0 -286
  110. aiq/data_models/embedder.py +0 -27
  111. aiq/data_models/evaluate.py +0 -127
  112. aiq/data_models/evaluator.py +0 -26
  113. aiq/data_models/front_end.py +0 -26
  114. aiq/data_models/function.py +0 -30
  115. aiq/data_models/function_dependencies.py +0 -72
  116. aiq/data_models/interactive.py +0 -246
  117. aiq/data_models/intermediate_step.py +0 -302
  118. aiq/data_models/invocation_node.py +0 -38
  119. aiq/data_models/its_strategy.py +0 -30
  120. aiq/data_models/llm.py +0 -27
  121. aiq/data_models/logging.py +0 -26
  122. aiq/data_models/memory.py +0 -27
  123. aiq/data_models/object_store.py +0 -44
  124. aiq/data_models/profiler.py +0 -54
  125. aiq/data_models/registry_handler.py +0 -26
  126. aiq/data_models/retriever.py +0 -30
  127. aiq/data_models/retry_mixin.py +0 -35
  128. aiq/data_models/span.py +0 -187
  129. aiq/data_models/step_adaptor.py +0 -64
  130. aiq/data_models/streaming.py +0 -33
  131. aiq/data_models/swe_bench_model.py +0 -54
  132. aiq/data_models/telemetry_exporter.py +0 -26
  133. aiq/embedder/__init__.py +0 -0
  134. aiq/embedder/langchain_client.py +0 -41
  135. aiq/embedder/nim_embedder.py +0 -59
  136. aiq/embedder/openai_embedder.py +0 -43
  137. aiq/embedder/register.py +0 -24
  138. aiq/eval/__init__.py +0 -14
  139. aiq/eval/config.py +0 -60
  140. aiq/eval/dataset_handler/__init__.py +0 -0
  141. aiq/eval/dataset_handler/dataset_downloader.py +0 -106
  142. aiq/eval/dataset_handler/dataset_filter.py +0 -52
  143. aiq/eval/dataset_handler/dataset_handler.py +0 -254
  144. aiq/eval/evaluate.py +0 -506
  145. aiq/eval/evaluator/__init__.py +0 -14
  146. aiq/eval/evaluator/base_evaluator.py +0 -73
  147. aiq/eval/evaluator/evaluator_model.py +0 -45
  148. aiq/eval/intermediate_step_adapter.py +0 -99
  149. aiq/eval/rag_evaluator/__init__.py +0 -0
  150. aiq/eval/rag_evaluator/evaluate.py +0 -178
  151. aiq/eval/rag_evaluator/register.py +0 -143
  152. aiq/eval/register.py +0 -23
  153. aiq/eval/remote_workflow.py +0 -133
  154. aiq/eval/runners/__init__.py +0 -14
  155. aiq/eval/runners/config.py +0 -39
  156. aiq/eval/runners/multi_eval_runner.py +0 -54
  157. aiq/eval/runtime_event_subscriber.py +0 -52
  158. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  159. aiq/eval/swe_bench_evaluator/evaluate.py +0 -215
  160. aiq/eval/swe_bench_evaluator/register.py +0 -36
  161. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  162. aiq/eval/trajectory_evaluator/evaluate.py +0 -75
  163. aiq/eval/trajectory_evaluator/register.py +0 -40
  164. aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
  165. aiq/eval/tunable_rag_evaluator/evaluate.py +0 -245
  166. aiq/eval/tunable_rag_evaluator/register.py +0 -52
  167. aiq/eval/usage_stats.py +0 -41
  168. aiq/eval/utils/__init__.py +0 -0
  169. aiq/eval/utils/output_uploader.py +0 -140
  170. aiq/eval/utils/tqdm_position_registry.py +0 -40
  171. aiq/eval/utils/weave_eval.py +0 -184
  172. aiq/experimental/__init__.py +0 -0
  173. aiq/experimental/decorators/__init__.py +0 -0
  174. aiq/experimental/decorators/experimental_warning_decorator.py +0 -130
  175. aiq/experimental/inference_time_scaling/__init__.py +0 -0
  176. aiq/experimental/inference_time_scaling/editing/__init__.py +0 -0
  177. aiq/experimental/inference_time_scaling/editing/iterative_plan_refinement_editor.py +0 -147
  178. aiq/experimental/inference_time_scaling/editing/llm_as_a_judge_editor.py +0 -204
  179. aiq/experimental/inference_time_scaling/editing/motivation_aware_summarization.py +0 -107
  180. aiq/experimental/inference_time_scaling/functions/__init__.py +0 -0
  181. aiq/experimental/inference_time_scaling/functions/execute_score_select_function.py +0 -105
  182. aiq/experimental/inference_time_scaling/functions/its_tool_orchestration_function.py +0 -205
  183. aiq/experimental/inference_time_scaling/functions/its_tool_wrapper_function.py +0 -146
  184. aiq/experimental/inference_time_scaling/functions/plan_select_execute_function.py +0 -224
  185. aiq/experimental/inference_time_scaling/models/__init__.py +0 -0
  186. aiq/experimental/inference_time_scaling/models/editor_config.py +0 -132
  187. aiq/experimental/inference_time_scaling/models/its_item.py +0 -48
  188. aiq/experimental/inference_time_scaling/models/scoring_config.py +0 -112
  189. aiq/experimental/inference_time_scaling/models/search_config.py +0 -120
  190. aiq/experimental/inference_time_scaling/models/selection_config.py +0 -154
  191. aiq/experimental/inference_time_scaling/models/stage_enums.py +0 -43
  192. aiq/experimental/inference_time_scaling/models/strategy_base.py +0 -66
  193. aiq/experimental/inference_time_scaling/models/tool_use_config.py +0 -41
  194. aiq/experimental/inference_time_scaling/register.py +0 -36
  195. aiq/experimental/inference_time_scaling/scoring/__init__.py +0 -0
  196. aiq/experimental/inference_time_scaling/scoring/llm_based_agent_scorer.py +0 -168
  197. aiq/experimental/inference_time_scaling/scoring/llm_based_plan_scorer.py +0 -168
  198. aiq/experimental/inference_time_scaling/scoring/motivation_aware_scorer.py +0 -111
  199. aiq/experimental/inference_time_scaling/search/__init__.py +0 -0
  200. aiq/experimental/inference_time_scaling/search/multi_llm_planner.py +0 -128
  201. aiq/experimental/inference_time_scaling/search/multi_query_retrieval_search.py +0 -122
  202. aiq/experimental/inference_time_scaling/search/single_shot_multi_plan_planner.py +0 -128
  203. aiq/experimental/inference_time_scaling/selection/__init__.py +0 -0
  204. aiq/experimental/inference_time_scaling/selection/best_of_n_selector.py +0 -63
  205. aiq/experimental/inference_time_scaling/selection/llm_based_agent_output_selector.py +0 -131
  206. aiq/experimental/inference_time_scaling/selection/llm_based_output_merging_selector.py +0 -159
  207. aiq/experimental/inference_time_scaling/selection/llm_based_plan_selector.py +0 -128
  208. aiq/experimental/inference_time_scaling/selection/threshold_selector.py +0 -58
  209. aiq/front_ends/__init__.py +0 -14
  210. aiq/front_ends/console/__init__.py +0 -14
  211. aiq/front_ends/console/authentication_flow_handler.py +0 -233
  212. aiq/front_ends/console/console_front_end_config.py +0 -32
  213. aiq/front_ends/console/console_front_end_plugin.py +0 -96
  214. aiq/front_ends/console/register.py +0 -25
  215. aiq/front_ends/cron/__init__.py +0 -14
  216. aiq/front_ends/fastapi/__init__.py +0 -14
  217. aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
  218. aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +0 -27
  219. aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +0 -107
  220. aiq/front_ends/fastapi/fastapi_front_end_config.py +0 -234
  221. aiq/front_ends/fastapi/fastapi_front_end_controller.py +0 -68
  222. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +0 -116
  223. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +0 -1092
  224. aiq/front_ends/fastapi/html_snippets/__init__.py +0 -14
  225. aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +0 -35
  226. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +0 -80
  227. aiq/front_ends/fastapi/job_store.py +0 -183
  228. aiq/front_ends/fastapi/main.py +0 -72
  229. aiq/front_ends/fastapi/message_handler.py +0 -298
  230. aiq/front_ends/fastapi/message_validator.py +0 -345
  231. aiq/front_ends/fastapi/register.py +0 -25
  232. aiq/front_ends/fastapi/response_helpers.py +0 -195
  233. aiq/front_ends/fastapi/step_adaptor.py +0 -321
  234. aiq/front_ends/mcp/__init__.py +0 -14
  235. aiq/front_ends/mcp/mcp_front_end_config.py +0 -32
  236. aiq/front_ends/mcp/mcp_front_end_plugin.py +0 -93
  237. aiq/front_ends/mcp/register.py +0 -27
  238. aiq/front_ends/mcp/tool_converter.py +0 -242
  239. aiq/front_ends/register.py +0 -22
  240. aiq/front_ends/simple_base/__init__.py +0 -14
  241. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +0 -54
  242. aiq/llm/__init__.py +0 -0
  243. aiq/llm/aws_bedrock_llm.py +0 -57
  244. aiq/llm/nim_llm.py +0 -46
  245. aiq/llm/openai_llm.py +0 -46
  246. aiq/llm/register.py +0 -23
  247. aiq/llm/utils/__init__.py +0 -14
  248. aiq/llm/utils/env_config_value.py +0 -94
  249. aiq/llm/utils/error.py +0 -17
  250. aiq/memory/__init__.py +0 -20
  251. aiq/memory/interfaces.py +0 -183
  252. aiq/memory/models.py +0 -112
  253. aiq/meta/module_to_distro.json +0 -3
  254. aiq/meta/pypi.md +0 -58
  255. aiq/object_store/__init__.py +0 -20
  256. aiq/object_store/in_memory_object_store.py +0 -74
  257. aiq/object_store/interfaces.py +0 -84
  258. aiq/object_store/models.py +0 -36
  259. aiq/object_store/register.py +0 -20
  260. aiq/observability/__init__.py +0 -14
  261. aiq/observability/exporter/__init__.py +0 -14
  262. aiq/observability/exporter/base_exporter.py +0 -449
  263. aiq/observability/exporter/exporter.py +0 -78
  264. aiq/observability/exporter/file_exporter.py +0 -33
  265. aiq/observability/exporter/processing_exporter.py +0 -322
  266. aiq/observability/exporter/raw_exporter.py +0 -52
  267. aiq/observability/exporter/span_exporter.py +0 -265
  268. aiq/observability/exporter_manager.py +0 -335
  269. aiq/observability/mixin/__init__.py +0 -14
  270. aiq/observability/mixin/batch_config_mixin.py +0 -26
  271. aiq/observability/mixin/collector_config_mixin.py +0 -23
  272. aiq/observability/mixin/file_mixin.py +0 -288
  273. aiq/observability/mixin/file_mode.py +0 -23
  274. aiq/observability/mixin/resource_conflict_mixin.py +0 -134
  275. aiq/observability/mixin/serialize_mixin.py +0 -61
  276. aiq/observability/mixin/type_introspection_mixin.py +0 -183
  277. aiq/observability/processor/__init__.py +0 -14
  278. aiq/observability/processor/batching_processor.py +0 -309
  279. aiq/observability/processor/callback_processor.py +0 -42
  280. aiq/observability/processor/intermediate_step_serializer.py +0 -28
  281. aiq/observability/processor/processor.py +0 -71
  282. aiq/observability/register.py +0 -96
  283. aiq/observability/utils/__init__.py +0 -14
  284. aiq/observability/utils/dict_utils.py +0 -236
  285. aiq/observability/utils/time_utils.py +0 -31
  286. aiq/plugins/.namespace +0 -1
  287. aiq/profiler/__init__.py +0 -0
  288. aiq/profiler/calc/__init__.py +0 -14
  289. aiq/profiler/calc/calc_runner.py +0 -627
  290. aiq/profiler/calc/calculations.py +0 -288
  291. aiq/profiler/calc/data_models.py +0 -188
  292. aiq/profiler/calc/plot.py +0 -345
  293. aiq/profiler/callbacks/__init__.py +0 -0
  294. aiq/profiler/callbacks/agno_callback_handler.py +0 -295
  295. aiq/profiler/callbacks/base_callback_class.py +0 -20
  296. aiq/profiler/callbacks/langchain_callback_handler.py +0 -290
  297. aiq/profiler/callbacks/llama_index_callback_handler.py +0 -205
  298. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +0 -238
  299. aiq/profiler/callbacks/token_usage_base_model.py +0 -27
  300. aiq/profiler/data_frame_row.py +0 -51
  301. aiq/profiler/data_models.py +0 -24
  302. aiq/profiler/decorators/__init__.py +0 -0
  303. aiq/profiler/decorators/framework_wrapper.py +0 -131
  304. aiq/profiler/decorators/function_tracking.py +0 -254
  305. aiq/profiler/forecasting/__init__.py +0 -0
  306. aiq/profiler/forecasting/config.py +0 -18
  307. aiq/profiler/forecasting/model_trainer.py +0 -75
  308. aiq/profiler/forecasting/models/__init__.py +0 -22
  309. aiq/profiler/forecasting/models/forecasting_base_model.py +0 -40
  310. aiq/profiler/forecasting/models/linear_model.py +0 -196
  311. aiq/profiler/forecasting/models/random_forest_regressor.py +0 -268
  312. aiq/profiler/inference_metrics_model.py +0 -28
  313. aiq/profiler/inference_optimization/__init__.py +0 -0
  314. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  315. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +0 -460
  316. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +0 -258
  317. aiq/profiler/inference_optimization/data_models.py +0 -386
  318. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  319. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +0 -468
  320. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +0 -405
  321. aiq/profiler/inference_optimization/llm_metrics.py +0 -212
  322. aiq/profiler/inference_optimization/prompt_caching.py +0 -163
  323. aiq/profiler/inference_optimization/token_uniqueness.py +0 -107
  324. aiq/profiler/inference_optimization/workflow_runtimes.py +0 -72
  325. aiq/profiler/intermediate_property_adapter.py +0 -102
  326. aiq/profiler/profile_runner.py +0 -473
  327. aiq/profiler/utils.py +0 -184
  328. aiq/registry_handlers/__init__.py +0 -0
  329. aiq/registry_handlers/local/__init__.py +0 -0
  330. aiq/registry_handlers/local/local_handler.py +0 -176
  331. aiq/registry_handlers/local/register_local.py +0 -37
  332. aiq/registry_handlers/metadata_factory.py +0 -60
  333. aiq/registry_handlers/package_utils.py +0 -198
  334. aiq/registry_handlers/pypi/__init__.py +0 -0
  335. aiq/registry_handlers/pypi/pypi_handler.py +0 -251
  336. aiq/registry_handlers/pypi/register_pypi.py +0 -40
  337. aiq/registry_handlers/register.py +0 -21
  338. aiq/registry_handlers/registry_handler_base.py +0 -157
  339. aiq/registry_handlers/rest/__init__.py +0 -0
  340. aiq/registry_handlers/rest/register_rest.py +0 -56
  341. aiq/registry_handlers/rest/rest_handler.py +0 -237
  342. aiq/registry_handlers/schemas/__init__.py +0 -0
  343. aiq/registry_handlers/schemas/headers.py +0 -42
  344. aiq/registry_handlers/schemas/package.py +0 -68
  345. aiq/registry_handlers/schemas/publish.py +0 -63
  346. aiq/registry_handlers/schemas/pull.py +0 -82
  347. aiq/registry_handlers/schemas/remove.py +0 -36
  348. aiq/registry_handlers/schemas/search.py +0 -91
  349. aiq/registry_handlers/schemas/status.py +0 -47
  350. aiq/retriever/__init__.py +0 -0
  351. aiq/retriever/interface.py +0 -37
  352. aiq/retriever/milvus/__init__.py +0 -14
  353. aiq/retriever/milvus/register.py +0 -81
  354. aiq/retriever/milvus/retriever.py +0 -228
  355. aiq/retriever/models.py +0 -74
  356. aiq/retriever/nemo_retriever/__init__.py +0 -14
  357. aiq/retriever/nemo_retriever/register.py +0 -60
  358. aiq/retriever/nemo_retriever/retriever.py +0 -190
  359. aiq/retriever/register.py +0 -22
  360. aiq/runtime/__init__.py +0 -14
  361. aiq/runtime/loader.py +0 -194
  362. aiq/runtime/runner.py +0 -190
  363. aiq/runtime/session.py +0 -158
  364. aiq/runtime/user_metadata.py +0 -130
  365. aiq/settings/__init__.py +0 -0
  366. aiq/settings/global_settings.py +0 -318
  367. aiq/test/.namespace +0 -1
  368. aiq/tool/__init__.py +0 -0
  369. aiq/tool/chat_completion.py +0 -74
  370. aiq/tool/code_execution/README.md +0 -152
  371. aiq/tool/code_execution/__init__.py +0 -0
  372. aiq/tool/code_execution/code_sandbox.py +0 -267
  373. aiq/tool/code_execution/local_sandbox/.gitignore +0 -1
  374. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +0 -60
  375. aiq/tool/code_execution/local_sandbox/__init__.py +0 -13
  376. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +0 -198
  377. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +0 -6
  378. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +0 -50
  379. aiq/tool/code_execution/register.py +0 -74
  380. aiq/tool/code_execution/test_code_execution_sandbox.py +0 -414
  381. aiq/tool/code_execution/utils.py +0 -100
  382. aiq/tool/datetime_tools.py +0 -42
  383. aiq/tool/document_search.py +0 -141
  384. aiq/tool/github_tools/__init__.py +0 -0
  385. aiq/tool/github_tools/create_github_commit.py +0 -133
  386. aiq/tool/github_tools/create_github_issue.py +0 -87
  387. aiq/tool/github_tools/create_github_pr.py +0 -106
  388. aiq/tool/github_tools/get_github_file.py +0 -106
  389. aiq/tool/github_tools/get_github_issue.py +0 -166
  390. aiq/tool/github_tools/get_github_pr.py +0 -256
  391. aiq/tool/github_tools/update_github_issue.py +0 -100
  392. aiq/tool/mcp/__init__.py +0 -14
  393. aiq/tool/mcp/exceptions.py +0 -142
  394. aiq/tool/mcp/mcp_client.py +0 -255
  395. aiq/tool/mcp/mcp_tool.py +0 -96
  396. aiq/tool/memory_tools/__init__.py +0 -0
  397. aiq/tool/memory_tools/add_memory_tool.py +0 -79
  398. aiq/tool/memory_tools/delete_memory_tool.py +0 -67
  399. aiq/tool/memory_tools/get_memory_tool.py +0 -72
  400. aiq/tool/nvidia_rag.py +0 -95
  401. aiq/tool/register.py +0 -38
  402. aiq/tool/retriever.py +0 -89
  403. aiq/tool/server_tools.py +0 -66
  404. aiq/utils/__init__.py +0 -0
  405. aiq/utils/data_models/__init__.py +0 -0
  406. aiq/utils/data_models/schema_validator.py +0 -58
  407. aiq/utils/debugging_utils.py +0 -43
  408. aiq/utils/exception_handlers/__init__.py +0 -0
  409. aiq/utils/exception_handlers/automatic_retries.py +0 -289
  410. aiq/utils/exception_handlers/mcp.py +0 -211
  411. aiq/utils/exception_handlers/schemas.py +0 -114
  412. aiq/utils/io/__init__.py +0 -0
  413. aiq/utils/io/model_processing.py +0 -28
  414. aiq/utils/io/yaml_tools.py +0 -119
  415. aiq/utils/log_utils.py +0 -37
  416. aiq/utils/metadata_utils.py +0 -74
  417. aiq/utils/optional_imports.py +0 -142
  418. aiq/utils/producer_consumer_queue.py +0 -178
  419. aiq/utils/reactive/__init__.py +0 -0
  420. aiq/utils/reactive/base/__init__.py +0 -0
  421. aiq/utils/reactive/base/observable_base.py +0 -65
  422. aiq/utils/reactive/base/observer_base.py +0 -55
  423. aiq/utils/reactive/base/subject_base.py +0 -79
  424. aiq/utils/reactive/observable.py +0 -59
  425. aiq/utils/reactive/observer.py +0 -76
  426. aiq/utils/reactive/subject.py +0 -131
  427. aiq/utils/reactive/subscription.py +0 -49
  428. aiq/utils/settings/__init__.py +0 -0
  429. aiq/utils/settings/global_settings.py +0 -197
  430. aiq/utils/string_utils.py +0 -38
  431. aiq/utils/type_converter.py +0 -290
  432. aiq/utils/type_utils.py +0 -484
  433. aiq/utils/url_utils.py +0 -27
  434. aiqtoolkit-1.2.0rc3.dist-info/METADATA +0 -363
  435. aiqtoolkit-1.2.0rc3.dist-info/RECORD +0 -437
  436. aiqtoolkit-1.2.0rc3.dist-info/entry_points.txt +0 -20
  437. aiqtoolkit-1.2.0rc3.dist-info/licenses/LICENSE-3rd-party.txt +0 -3686
  438. aiqtoolkit-1.2.0rc3.dist-info/licenses/LICENSE.md +0 -201
  439. aiqtoolkit-1.2.0rc3.dist-info/top_level.txt +0 -1
  440. {aiqtoolkit-1.2.0rc3.dist-info → aiqtoolkit-1.2.0rc5.dist-info}/WHEEL +0 -0
@@ -1,468 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
- """
16
- An enhanced script that:
17
-
18
- 1. Groups workflow events by example_number to build a per-example call tree (no cross-example nesting).
19
- 2. Tracks concurrency globally across *all* examples.
20
- 3. Identifies concurrency "spikes" (concurrency >= a threshold).
21
- 4. Correlates concurrency spikes with token usage and call metadata.
22
- 5. Computes average call latency by concurrency level, using midpoint concurrency as an approximation.
23
- 6. Returns a Pydantic result containing concurrency distribution, spike intervals, correlation stats, etc.,
24
- along with a textual report containing the real call count, active calls in spikes, etc.
25
-
26
- Changes from previous version:
27
-
28
- - Now shows the actual total calls in the dataset.
29
- - Displays the real number of active calls for each spike interval.
30
- - Computes and reports average latency by concurrency (no visualization).
31
-
32
- """
33
-
34
- import numpy as np
35
- import pandas as pd
36
-
37
- from aiq.data_models.intermediate_step import IntermediateStep
38
- from aiq.profiler.inference_optimization.data_models import ConcurrencyAnalysisResult
39
- from aiq.profiler.inference_optimization.data_models import ConcurrencyCallNode
40
- from aiq.profiler.inference_optimization.data_models import ConcurrencyCorrelationStats
41
- from aiq.profiler.inference_optimization.data_models import ConcurrencySpikeInfo
42
- from aiq.profiler.utils import create_standardized_dataframe
43
-
44
- # --------------------------------------------------------------------------------
45
- # 1) Building the Per-Example Call Trees
46
- # --------------------------------------------------------------------------------
47
-
48
-
49
def build_call_tree_for_example(example_df: pd.DataFrame) -> list[ConcurrencyCallNode]:
    """
    Build the call tree of a single example from its START/END events.

    Rows are consumed in the order given, so the frame should already be sorted by
    ``event_timestamp``. Only events whose type starts with ``LLM_`` or ``TOOL_`` are used.
    A ``*_START`` event opens a node and nests it under the most recently opened call that is
    still running; the ``*_END`` event with the same ``UUID`` closes the node and fills in its
    duration, token counts and outputs. END events without a matching START are ignored.

    Args:
        example_df: Events of one example. Reads ``example_number``, ``event_type`` (objects
            exposing ``.value``), ``UUID`` and ``event_timestamp``; ``llm_name``, ``tool_name``,
            ``prompt_tokens``, ``completion_tokens``, ``total_tokens``, ``metadata`` and
            ``llm_text_output`` are read with ``row.get`` and may be absent.

    Returns:
        The calls that had no open parent when they started.
    """
    open_calls: list[ConcurrencyCallNode] = []  # started but not yet ended, oldest first
    top_level: dict[str, ConcurrencyCallNode] = {}
    pending: dict[str, ConcurrencyCallNode] = {}  # UUID -> node still waiting for its END

    def parse_op_type(event_name: str) -> str | None:
        # `event_name` is already upper-cased by the caller.
        if event_name.startswith("LLM_"):
            return "LLM"
        if event_name.startswith("TOOL_"):
            return "TOOL"
        return None

    def get_op_name(row: pd.Series, op_type: str) -> str:
        if op_type == "LLM":
            return row.get("llm_name") or "unknown_llm"
        if op_type == "TOOL":
            return row.get("tool_name") or "unknown_tool"
        return "unknown_op"

    example_num = int(example_df["example_number"].iloc[0])

    for _, row in example_df.iterrows():
        event_name = row["event_type"].value.upper()
        uuid = str(row["UUID"])
        ts = float(row["event_timestamp"])
        op_type = parse_op_type(event_name)
        if not op_type:
            continue

        if event_name.endswith("_START"):
            node = ConcurrencyCallNode(
                uuid=uuid,
                example_number=example_num,
                operation_type=op_type,
                operation_name=get_op_name(row, op_type),
                start_time=ts,
                end_time=ts,  # updated on END
                duration=0.0)
            if open_calls:
                parent = open_calls[-1]
                node.parent = parent
                parent.children.append(node)
            else:
                top_level[uuid] = node

            open_calls.append(node)
            pending[uuid] = node

        elif event_name.endswith("_END"):
            node = pending.pop(uuid, None)
            if node is None:
                # END without a recorded START: nothing to close.
                continue

            node.end_time = ts
            node.duration = max(0.0, node.end_time - node.start_time)
            node.prompt_tokens = row.get("prompt_tokens")
            node.completion_tokens = row.get("completion_tokens")
            node.total_tokens = row.get("total_tokens")
            metadata = row.get("metadata")
            node.tool_outputs = (metadata.get("tool_outputs") or None) if metadata else None
            node.llm_text_output = row.get("llm_text_output")

            # Overlapping calls can end in a different order than they started, so the
            # finished node is not necessarily the innermost one. Remove it from wherever it
            # sits; otherwise it would linger and adopt later calls as children. Identity is
            # used instead of `==` because nodes reference each other through parent/children.
            for idx in range(len(open_calls) - 1, -1, -1):
                if open_calls[idx] is node:
                    del open_calls[idx]
                    break

    # gather top-level
    return [nd for nd in top_level.values() if nd.parent is None]
125
-
126
-
127
def build_call_tree_per_example(df: pd.DataFrame) -> list[ConcurrencyCallNode]:
    """
    Build one call tree per ``example_number`` and return all top-level calls in a single list.

    The input frame is left untouched; a sorted copy (by ``example_number``, then
    ``event_timestamp``) is split per example and each slice is handed to
    ``build_call_tree_for_example``.

    Raises:
        ValueError: if any of ``example_number``, ``event_type``, ``UUID`` or
            ``event_timestamp`` is not a column of ``df``.
    """
    required = {"example_number", "event_type", "UUID", "event_timestamp"}
    missing = required - set(df.columns)
    if missing:
        raise ValueError(f"DataFrame missing required columns: {missing}")

    # sort_values without inplace returns a new frame, so no explicit copy is needed.
    ordered = df.sort_values(["example_number", "event_timestamp"])

    all_roots: list[ConcurrencyCallNode] = []
    for _, example_events in ordered.groupby("example_number"):
        all_roots.extend(build_call_tree_for_example(example_events))
    return all_roots
144
-
145
-
146
def flatten_calls(roots: list[ConcurrencyCallNode]) -> list[ConcurrencyCallNode]:
    """
    Produce a flat list of all calls (including nested ones) in depth-first pre-order.

    Each root is followed by its descendants before the next root appears, and children keep
    the order of their parent's ``children`` list. The traversal uses an explicit stack rather
    than recursion so that very deep call chains cannot hit the interpreter's recursion limit.

    Args:
        roots: Top-level calls; every node must expose a ``children`` sequence.

    Returns:
        A new list containing every reachable node exactly once per occurrence in the tree.
    """
    ordered: list[ConcurrencyCallNode] = []
    # Pushed in reverse so that popping from the end yields nodes left-to-right.
    pending = list(reversed(roots))
    while pending:
        node = pending.pop()
        ordered.append(node)
        pending.extend(reversed(node.children))
    return ordered
160
-
161
-
162
- # --------------------------------------------------------------------------------
163
- # 2) Global Concurrency Distribution & Segments
164
- # --------------------------------------------------------------------------------
165
-
166
-
167
def compute_concurrency_distribution(roots: list[ConcurrencyCallNode]) -> dict[int, float]:
    """
    Accumulate, for every concurrency level, the total time spent at that level.

    All calls (nested ones included) are flattened and turned into ``(start, +1)`` /
    ``(end, -1)`` events. Sweeping the events in time order, the span between two consecutive
    distinct timestamps is credited to the number of calls open during that span; gaps with no
    open call are credited to level ``0``. Calls whose ``start_time`` is after their
    ``end_time`` are skipped.

    Args:
        roots: Top-level calls as returned by the call-tree builders.

    Returns:
        Mapping of concurrency level to accumulated time, in the unit of the node timestamps.
        Empty when there are no calls or none of them has a valid interval.
    """
    events: list[tuple[float, int]] = []
    for node in flatten_calls(roots):
        if node.start_time <= node.end_time:
            events.append((node.start_time, +1))
            events.append((node.end_time, -1))

    # Covers both "no calls at all" and "every call was filtered out above"; the latter used
    # to fall through to events[0] and raise IndexError.
    if not events:
        return {}

    events.sort(key=lambda ev: ev[0])
    dist_map: dict[int, float] = {}
    curr_conc = 0
    prev_time = events[0][0]

    for time_val, delta in events:
        if time_val > prev_time:
            dist_map[curr_conc] = dist_map.get(curr_conc, 0.0) + (time_val - prev_time)
        curr_conc += delta
        prev_time = time_val

    return dist_map
194
-
195
-
196
def build_concurrency_segments(roots: list[ConcurrencyCallNode]) -> list[tuple[float, float, int]]:
    """
    Return piecewise-constant segments ``(start, end, concurrency)`` across all calls.

    All calls (nested ones included) are flattened and turned into ``(start, +1)`` /
    ``(end, -1)`` events. Sweeping the events in time order, one segment is emitted for each
    span between two consecutive distinct timestamps, tagged with the number of calls open
    during it (which may be ``0`` for gaps). Calls whose ``start_time`` is after their
    ``end_time`` are skipped.

    Args:
        roots: Top-level calls as returned by the call-tree builders.

    Returns:
        Segments in ascending time order; empty when there are no calls or none of them has
        a valid interval.
    """
    events: list[tuple[float, int]] = []
    for node in flatten_calls(roots):
        if node.start_time <= node.end_time:
            events.append((node.start_time, +1))
            events.append((node.end_time, -1))

    # Covers both "no calls at all" and "every call was filtered out above"; the latter used
    # to fall through to events[0] and raise IndexError.
    if not events:
        return []

    events.sort(key=lambda ev: ev[0])
    segments: list[tuple[float, float, int]] = []
    curr_conc = 0
    prev_time = events[0][0]

    for t, delta in events:
        if t > prev_time:
            segments.append((prev_time, t, curr_conc))
        curr_conc += delta
        prev_time = t

    return segments
222
-
223
-
224
def find_percentile_concurrency(dist_map: dict[int, float], percentile: float) -> float:
    """
    Return the concurrency level at which the cumulative time reaches a given percentile.

    Levels are visited in ascending order while their durations are accumulated; the first
    level whose running total reaches ``percentile`` percent of the overall time is returned.

    Args:
        dist_map: Mapping of concurrency level -> total time spent at that level.
        percentile: Percentile on a 0-100 scale.

    Returns:
        The matching concurrency level as a float. ``0.0`` when the total time is not
        positive. If the running total never reaches the cutoff, the highest level is
        returned.
    """
    observed = sum(dist_map.values())
    if observed <= 0:
        return 0.0

    cutoff = percentile * 0.01 * observed
    running = 0.0
    highest_seen = 0

    # Keys are unique, so sorting the keys visits the same (level, duration) pairs in the
    # same order as sorting the items by key.
    for level in sorted(dist_map):
        running += dist_map[level]
        if running >= cutoff:
            return float(level)
        highest_seen = level

    return float(highest_seen)
243
-
244
-
245
- # --------------------------------------------------------------------------------
246
- # 3) Spike Detection & Active Calls
247
- # --------------------------------------------------------------------------------
248
-
249
-
250
def detect_concurrency_spikes(segments: list[tuple[float, float, int]], threshold: int) -> list[ConcurrencySpikeInfo]:
    """
    Select the timeline segments that count as concurrency spikes.

    A segment is a spike when its concurrency is at least ``threshold`` and it has a
    strictly positive length.

    Args:
        segments: ``(start, end, concurrency)`` tuples.
        threshold: Minimum concurrency for a segment to be reported.

    Returns:
        One ``ConcurrencySpikeInfo`` per qualifying segment, in input order.
    """
    return [
        ConcurrencySpikeInfo(start_time=seg_start, end_time=seg_end, concurrency=level)
        for seg_start, seg_end, level in segments
        if level >= threshold and seg_end > seg_start
    ]
260
-
261
-
262
def find_calls_active_in_interval(roots: list[ConcurrencyCallNode], start_t: float,
                                  end_t: float) -> list[ConcurrencyCallNode]:
    """
    Collect every call (nested calls included) that overlaps ``[start_t, end_t)``.

    A call is excluded when it ends at or before ``start_t`` or starts at or after
    ``end_t``; everything else is considered overlapping.

    Args:
        roots: Root nodes of the call forest; flattened with ``flatten_calls``.
        start_t: Start of the interval.
        end_t: End of the interval.

    Returns:
        The overlapping calls, in the order ``flatten_calls`` yields them.
    """
    return [
        node for node in flatten_calls(roots)
        # Negated comparisons are kept as-is (rather than flipped to > / <) so the
        # outcome is the same for any operand values.
        if not node.end_time <= start_t and not node.start_time >= end_t
    ]
274
-
275
-
276
- # --------------------------------------------------------------------------------
277
- # 4) Correlations & Average Latency by Concurrency
278
- # --------------------------------------------------------------------------------
279
-
280
def correlate_spike_calls(spikes: list[ConcurrencySpikeInfo], roots: list[ConcurrencyCallNode]) \
        -> ConcurrencyCorrelationStats:
    """
    Correlate spike intervals with the calls that were active during them.

    For each spike, the overlapping calls are looked up with
    ``find_calls_active_in_interval``; their distinct UUIDs are stored on the spike as
    ``active_uuids`` and their positive ``prompt_tokens`` / ``total_tokens`` values are
    pooled. The pooled values are then averaged.

    Args:
        spikes: Spike intervals; each one is mutated in place (``active_uuids`` is set).
        roots: Root nodes of the call forest.

    Returns:
        ``ConcurrencyCorrelationStats`` with the mean prompt and total token counts, each
        ``0.0`` when no positive value was collected.
    """
    p_tokens = []
    t_tokens = []

    for sp in spikes:
        active = find_calls_active_in_interval(roots, sp.start_time, sp.end_time)

        # De-duplicate while keeping first-seen order. Going through a set would make the
        # stored order depend on hashing and therefore vary between runs.
        sp.active_uuids = list(dict.fromkeys(c.uuid for c in active))

        # NOTE(review): a call overlapping several spike segments is pooled once per
        # segment, so it weighs more in the averages - confirm this is intended.
        for c in active:
            if c.prompt_tokens and c.prompt_tokens > 0:
                p_tokens.append(c.prompt_tokens)
            if c.total_tokens and c.total_tokens > 0:
                t_tokens.append(c.total_tokens)

    def safe_avg(lst):
        # np.mean of an empty sequence is NaN (with a warning); report 0.0 instead.
        return float(np.mean(lst)) if lst else 0.0

    return ConcurrencyCorrelationStats(
        avg_prompt_tokens=safe_avg(p_tokens),
        avg_total_tokens=safe_avg(t_tokens),
    )
306
-
307
-
308
def compute_midpoint_concurrency(n: ConcurrencyCallNode, segments: list[tuple[float, float, int]]) -> float:
    """
    Look up the concurrency level in effect at the temporal midpoint of a call.

    Args:
        n: The call; only ``start_time`` and ``end_time`` are read.
        segments: ``(start, end, concurrency)`` tuples. The binary search relies on them
            being ordered by time and non-overlapping, as ``build_concurrency_segments``
            produces them.

    Returns:
        Concurrency of the segment whose half-open range ``[start, end)`` contains the
        midpoint. ``0.0`` when the call has no positive duration or no segment matches.
    """
    if n.start_time >= n.end_time:
        return 0.0

    midpoint = 0.5 * (n.start_time + n.end_time)

    # Binary search over the half-open index window [lo, hi).
    lo, hi = 0, len(segments)
    while lo < hi:
        probe = (lo + hi - 1) // 2
        seg_start, seg_end, seg_conc = segments[probe]
        if seg_start <= midpoint < seg_end:
            return float(seg_conc)
        if midpoint < seg_start:
            hi = probe
        else:
            lo = probe + 1

    return 0.0
328
-
329
-
330
def average_latency_by_midpoint_concurrency(roots: list[ConcurrencyCallNode]) -> dict[int, float]:
    """
    Average call duration, bucketed by the concurrency level at each call's midpoint.

    Each call in the forest (nested calls included) is assigned to the bucket given by
    ``compute_midpoint_concurrency`` truncated to an int, and its ``duration`` is recorded
    there. Calls for which that lookup yields ``0.0`` land in bucket ``0``.

    Args:
        roots: Root nodes of the call forest.

    Returns:
        Mapping of concurrency level -> mean duration of the calls in that bucket. Empty
        when the forest contains no calls.
    """
    from collections import defaultdict

    segs = build_concurrency_segments(roots)

    # concurrency level => durations of the calls whose midpoint falls at that level
    durations_by_level = defaultdict(list)
    for call in flatten_calls(roots):
        level = int(compute_midpoint_concurrency(call, segs))
        durations_by_level[level].append(call.duration)

    # A bucket only exists once a duration has been appended to it, so every list here
    # is non-empty and no empty-bucket fallback is needed.
    return {level: float(np.mean(durations)) for level, durations in durations_by_level.items()}
354
-
355
-
356
- # --------------------------------------------------------------------------------
357
- # 5) Main Analysis Function
358
- # --------------------------------------------------------------------------------
359
-
360
-
361
def concurrency_spike_analysis(
    all_steps: list[list[IntermediateStep]],
    concurrency_spike_threshold: int | None = None,
) -> ConcurrencyAnalysisResult:
    """
    Run the full concurrency analysis and return the results with a textual report.

    Steps:
      1. Standardize ``all_steps`` into a DataFrame and check the required columns.
      2. Build the call forest, then the concurrency distribution over all calls.
      3. Derive the p50 / p90 / p95 / p99 concurrency levels.
      4. If no threshold is given, use ceil(p90 concurrency), with a minimum of 1.
      5. Build the concurrency segments, detect spikes and correlate them with the
         calls active in them.
      6. Compute the average latency bucketed by midpoint concurrency.
      7. Assemble the textual report and return everything in one result object.

    Args:
        all_steps: Recorded intermediate steps, one inner list per example.
        concurrency_spike_threshold: Concurrency at or above which a segment is a spike;
            derived from p90 when ``None``.

    Returns:
        A ``ConcurrencyAnalysisResult`` holding the distribution, percentiles, threshold,
        spike intervals, correlation stats, latency buckets and the report text.

    Raises:
        ValueError: If the standardized DataFrame lacks any required column.
    """
    frame = create_standardized_dataframe(all_steps)
    required_cols = {
        "framework",
        "llm_name",
        "llm_text_input",
        "llm_text_output",
        "event_timestamp",
        "event_type",
        "UUID",
        "example_number",
        "prompt_tokens",
        "completion_tokens",
        "total_tokens",
    }
    absent = required_cols - set(frame.columns)
    if absent:
        raise ValueError(f"DataFrame missing required columns: {absent}")

    # Call forest across all examples
    forest = build_call_tree_per_example(frame)
    call_count = len(flatten_calls(forest))

    # Time spent per concurrency level, and the percentiles derived from it
    distribution = compute_concurrency_distribution(forest)
    observed_time = sum(distribution.values())
    p50_c, p90_c, p95_c, p99_c = (find_percentile_concurrency(distribution, pct) for pct in (50, 90, 95, 99))

    # Default threshold: ceil of the p90 concurrency, never below 1
    if concurrency_spike_threshold is None:
        concurrency_spike_threshold = max(1, int(np.ceil(p90_c)))

    # Timeline segments -> spikes -> token correlation -> latency buckets
    timeline = build_concurrency_segments(forest)
    spike_intervals = detect_concurrency_spikes(timeline, concurrency_spike_threshold)
    corr_stats = correlate_spike_calls(spike_intervals, forest)
    latency_by_level = average_latency_by_midpoint_concurrency(forest)

    # Textual report
    report = [
        "=== Concurrency Spike Analysis ===",
        f"Total calls in dataset: {call_count}",
        f"Total time observed: {observed_time:.2f} units (sum of concurrency timeline)",
        "\n-- Concurrency Distribution --",
    ]
    report.extend(f" concurrency={level}: {distribution[level]:.2f} time" for level in sorted(distribution))

    report.append(f"\nPercentiles => p50={p50_c:.1f}, p90={p90_c:.1f}, p95={p95_c:.1f}, p99={p99_c:.1f}")
    report.append(f"Spike threshold chosen: {concurrency_spike_threshold}")

    report.append("\n-- Detected Spike Intervals --")
    if spike_intervals:
        for idx, spike in enumerate(spike_intervals, start=1):
            span = spike.end_time - spike.start_time
            n_active = len(spike.active_uuids)
            report.append(f"{idx}) {spike.start_time:.2f}-{spike.end_time:.2f}, concurrency={spike.concurrency}, "
                          f"length={span:.2f}, #active_calls={n_active}")
    else:
        report.append("No intervals exceed concurrency spike threshold.")

    report.append("\n-- Correlation Stats for Spiked Calls --")
    report.append(f"Avg prompt_tokens in spike calls: {corr_stats.avg_prompt_tokens:.1f}")
    report.append(f"Avg total_tokens in spike calls : {corr_stats.avg_total_tokens:.1f}")

    report.append("\n-- Average Latency by Midpoint Concurrency --")
    if latency_by_level:
        report.extend(f" concurrency={level} => avg_latency={latency_by_level[level]:.2f}"
                      for level in sorted(latency_by_level))
    else:
        report.append("No calls or no concurrency data.")

    return ConcurrencyAnalysisResult(
        concurrency_distribution=distribution,
        p50_concurrency=p50_c,
        p90_concurrency=p90_c,
        p95_concurrency=p95_c,
        p99_concurrency=p99_c,
        spike_threshold=concurrency_spike_threshold,
        spike_intervals=spike_intervals,
        correlation_stats=corr_stats,
        textual_report="\n".join(report),
        average_latency_by_concurrency=latency_by_level,
    )