aiqtoolkit 1.2.0rc4__py3-none-any.whl → 1.2rc9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of aiqtoolkit might be problematic. Click here for more details.

Files changed (441)
  1. aiqtoolkit-1.2rc9.dist-info/METADATA +29 -0
  2. aiqtoolkit-1.2rc9.dist-info/RECORD +4 -0
  3. aiqtoolkit-1.2rc9.dist-info/top_level.txt +1 -0
  4. aiq/agent/__init__.py +0 -0
  5. aiq/agent/base.py +0 -239
  6. aiq/agent/dual_node.py +0 -67
  7. aiq/agent/react_agent/__init__.py +0 -0
  8. aiq/agent/react_agent/agent.py +0 -355
  9. aiq/agent/react_agent/output_parser.py +0 -104
  10. aiq/agent/react_agent/prompt.py +0 -41
  11. aiq/agent/react_agent/register.py +0 -149
  12. aiq/agent/reasoning_agent/__init__.py +0 -0
  13. aiq/agent/reasoning_agent/reasoning_agent.py +0 -225
  14. aiq/agent/register.py +0 -23
  15. aiq/agent/rewoo_agent/__init__.py +0 -0
  16. aiq/agent/rewoo_agent/agent.py +0 -411
  17. aiq/agent/rewoo_agent/prompt.py +0 -108
  18. aiq/agent/rewoo_agent/register.py +0 -158
  19. aiq/agent/tool_calling_agent/__init__.py +0 -0
  20. aiq/agent/tool_calling_agent/agent.py +0 -119
  21. aiq/agent/tool_calling_agent/register.py +0 -106
  22. aiq/authentication/__init__.py +0 -14
  23. aiq/authentication/api_key/__init__.py +0 -14
  24. aiq/authentication/api_key/api_key_auth_provider.py +0 -96
  25. aiq/authentication/api_key/api_key_auth_provider_config.py +0 -124
  26. aiq/authentication/api_key/register.py +0 -26
  27. aiq/authentication/exceptions/__init__.py +0 -14
  28. aiq/authentication/exceptions/api_key_exceptions.py +0 -38
  29. aiq/authentication/exceptions/auth_code_grant_exceptions.py +0 -86
  30. aiq/authentication/exceptions/call_back_exceptions.py +0 -38
  31. aiq/authentication/exceptions/request_exceptions.py +0 -54
  32. aiq/authentication/http_basic_auth/__init__.py +0 -0
  33. aiq/authentication/http_basic_auth/http_basic_auth_provider.py +0 -81
  34. aiq/authentication/http_basic_auth/register.py +0 -30
  35. aiq/authentication/interfaces.py +0 -93
  36. aiq/authentication/oauth2/__init__.py +0 -14
  37. aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +0 -107
  38. aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +0 -39
  39. aiq/authentication/oauth2/register.py +0 -25
  40. aiq/authentication/register.py +0 -21
  41. aiq/builder/__init__.py +0 -0
  42. aiq/builder/builder.py +0 -285
  43. aiq/builder/component_utils.py +0 -316
  44. aiq/builder/context.py +0 -264
  45. aiq/builder/embedder.py +0 -24
  46. aiq/builder/eval_builder.py +0 -161
  47. aiq/builder/evaluator.py +0 -29
  48. aiq/builder/framework_enum.py +0 -24
  49. aiq/builder/front_end.py +0 -73
  50. aiq/builder/function.py +0 -344
  51. aiq/builder/function_base.py +0 -380
  52. aiq/builder/function_info.py +0 -627
  53. aiq/builder/intermediate_step_manager.py +0 -174
  54. aiq/builder/llm.py +0 -25
  55. aiq/builder/retriever.py +0 -25
  56. aiq/builder/user_interaction_manager.py +0 -74
  57. aiq/builder/workflow.py +0 -148
  58. aiq/builder/workflow_builder.py +0 -1117
  59. aiq/cli/__init__.py +0 -14
  60. aiq/cli/cli_utils/__init__.py +0 -0
  61. aiq/cli/cli_utils/config_override.py +0 -231
  62. aiq/cli/cli_utils/validation.py +0 -37
  63. aiq/cli/commands/__init__.py +0 -0
  64. aiq/cli/commands/configure/__init__.py +0 -0
  65. aiq/cli/commands/configure/channel/__init__.py +0 -0
  66. aiq/cli/commands/configure/channel/add.py +0 -28
  67. aiq/cli/commands/configure/channel/channel.py +0 -36
  68. aiq/cli/commands/configure/channel/remove.py +0 -30
  69. aiq/cli/commands/configure/channel/update.py +0 -30
  70. aiq/cli/commands/configure/configure.py +0 -33
  71. aiq/cli/commands/evaluate.py +0 -139
  72. aiq/cli/commands/info/__init__.py +0 -14
  73. aiq/cli/commands/info/info.py +0 -39
  74. aiq/cli/commands/info/list_channels.py +0 -32
  75. aiq/cli/commands/info/list_components.py +0 -129
  76. aiq/cli/commands/info/list_mcp.py +0 -213
  77. aiq/cli/commands/registry/__init__.py +0 -14
  78. aiq/cli/commands/registry/publish.py +0 -88
  79. aiq/cli/commands/registry/pull.py +0 -118
  80. aiq/cli/commands/registry/registry.py +0 -38
  81. aiq/cli/commands/registry/remove.py +0 -108
  82. aiq/cli/commands/registry/search.py +0 -155
  83. aiq/cli/commands/sizing/__init__.py +0 -14
  84. aiq/cli/commands/sizing/calc.py +0 -297
  85. aiq/cli/commands/sizing/sizing.py +0 -27
  86. aiq/cli/commands/start.py +0 -246
  87. aiq/cli/commands/uninstall.py +0 -81
  88. aiq/cli/commands/validate.py +0 -47
  89. aiq/cli/commands/workflow/__init__.py +0 -14
  90. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  91. aiq/cli/commands/workflow/templates/config.yml.j2 +0 -16
  92. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +0 -22
  93. aiq/cli/commands/workflow/templates/register.py.j2 +0 -5
  94. aiq/cli/commands/workflow/templates/workflow.py.j2 +0 -36
  95. aiq/cli/commands/workflow/workflow.py +0 -37
  96. aiq/cli/commands/workflow/workflow_commands.py +0 -313
  97. aiq/cli/entrypoint.py +0 -135
  98. aiq/cli/main.py +0 -44
  99. aiq/cli/register_workflow.py +0 -488
  100. aiq/cli/type_registry.py +0 -1000
  101. aiq/data_models/__init__.py +0 -14
  102. aiq/data_models/api_server.py +0 -694
  103. aiq/data_models/authentication.py +0 -231
  104. aiq/data_models/common.py +0 -171
  105. aiq/data_models/component.py +0 -54
  106. aiq/data_models/component_ref.py +0 -168
  107. aiq/data_models/config.py +0 -406
  108. aiq/data_models/dataset_handler.py +0 -123
  109. aiq/data_models/discovery_metadata.py +0 -335
  110. aiq/data_models/embedder.py +0 -27
  111. aiq/data_models/evaluate.py +0 -127
  112. aiq/data_models/evaluator.py +0 -26
  113. aiq/data_models/front_end.py +0 -26
  114. aiq/data_models/function.py +0 -30
  115. aiq/data_models/function_dependencies.py +0 -72
  116. aiq/data_models/interactive.py +0 -246
  117. aiq/data_models/intermediate_step.py +0 -302
  118. aiq/data_models/invocation_node.py +0 -38
  119. aiq/data_models/its_strategy.py +0 -30
  120. aiq/data_models/llm.py +0 -27
  121. aiq/data_models/logging.py +0 -26
  122. aiq/data_models/memory.py +0 -27
  123. aiq/data_models/object_store.py +0 -44
  124. aiq/data_models/profiler.py +0 -54
  125. aiq/data_models/registry_handler.py +0 -26
  126. aiq/data_models/retriever.py +0 -30
  127. aiq/data_models/retry_mixin.py +0 -35
  128. aiq/data_models/span.py +0 -187
  129. aiq/data_models/step_adaptor.py +0 -64
  130. aiq/data_models/streaming.py +0 -33
  131. aiq/data_models/swe_bench_model.py +0 -54
  132. aiq/data_models/telemetry_exporter.py +0 -26
  133. aiq/embedder/__init__.py +0 -0
  134. aiq/embedder/langchain_client.py +0 -41
  135. aiq/embedder/nim_embedder.py +0 -59
  136. aiq/embedder/openai_embedder.py +0 -43
  137. aiq/embedder/register.py +0 -24
  138. aiq/eval/__init__.py +0 -14
  139. aiq/eval/config.py +0 -60
  140. aiq/eval/dataset_handler/__init__.py +0 -0
  141. aiq/eval/dataset_handler/dataset_downloader.py +0 -106
  142. aiq/eval/dataset_handler/dataset_filter.py +0 -52
  143. aiq/eval/dataset_handler/dataset_handler.py +0 -254
  144. aiq/eval/evaluate.py +0 -506
  145. aiq/eval/evaluator/__init__.py +0 -14
  146. aiq/eval/evaluator/base_evaluator.py +0 -73
  147. aiq/eval/evaluator/evaluator_model.py +0 -45
  148. aiq/eval/intermediate_step_adapter.py +0 -99
  149. aiq/eval/rag_evaluator/__init__.py +0 -0
  150. aiq/eval/rag_evaluator/evaluate.py +0 -178
  151. aiq/eval/rag_evaluator/register.py +0 -143
  152. aiq/eval/register.py +0 -23
  153. aiq/eval/remote_workflow.py +0 -133
  154. aiq/eval/runners/__init__.py +0 -14
  155. aiq/eval/runners/config.py +0 -39
  156. aiq/eval/runners/multi_eval_runner.py +0 -54
  157. aiq/eval/runtime_event_subscriber.py +0 -52
  158. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  159. aiq/eval/swe_bench_evaluator/evaluate.py +0 -215
  160. aiq/eval/swe_bench_evaluator/register.py +0 -36
  161. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  162. aiq/eval/trajectory_evaluator/evaluate.py +0 -75
  163. aiq/eval/trajectory_evaluator/register.py +0 -40
  164. aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
  165. aiq/eval/tunable_rag_evaluator/evaluate.py +0 -245
  166. aiq/eval/tunable_rag_evaluator/register.py +0 -52
  167. aiq/eval/usage_stats.py +0 -41
  168. aiq/eval/utils/__init__.py +0 -0
  169. aiq/eval/utils/output_uploader.py +0 -140
  170. aiq/eval/utils/tqdm_position_registry.py +0 -40
  171. aiq/eval/utils/weave_eval.py +0 -184
  172. aiq/experimental/__init__.py +0 -0
  173. aiq/experimental/decorators/__init__.py +0 -0
  174. aiq/experimental/decorators/experimental_warning_decorator.py +0 -130
  175. aiq/experimental/inference_time_scaling/__init__.py +0 -0
  176. aiq/experimental/inference_time_scaling/editing/__init__.py +0 -0
  177. aiq/experimental/inference_time_scaling/editing/iterative_plan_refinement_editor.py +0 -147
  178. aiq/experimental/inference_time_scaling/editing/llm_as_a_judge_editor.py +0 -204
  179. aiq/experimental/inference_time_scaling/editing/motivation_aware_summarization.py +0 -107
  180. aiq/experimental/inference_time_scaling/functions/__init__.py +0 -0
  181. aiq/experimental/inference_time_scaling/functions/execute_score_select_function.py +0 -105
  182. aiq/experimental/inference_time_scaling/functions/its_tool_orchestration_function.py +0 -205
  183. aiq/experimental/inference_time_scaling/functions/its_tool_wrapper_function.py +0 -146
  184. aiq/experimental/inference_time_scaling/functions/plan_select_execute_function.py +0 -224
  185. aiq/experimental/inference_time_scaling/models/__init__.py +0 -0
  186. aiq/experimental/inference_time_scaling/models/editor_config.py +0 -132
  187. aiq/experimental/inference_time_scaling/models/its_item.py +0 -48
  188. aiq/experimental/inference_time_scaling/models/scoring_config.py +0 -112
  189. aiq/experimental/inference_time_scaling/models/search_config.py +0 -120
  190. aiq/experimental/inference_time_scaling/models/selection_config.py +0 -154
  191. aiq/experimental/inference_time_scaling/models/stage_enums.py +0 -43
  192. aiq/experimental/inference_time_scaling/models/strategy_base.py +0 -66
  193. aiq/experimental/inference_time_scaling/models/tool_use_config.py +0 -41
  194. aiq/experimental/inference_time_scaling/register.py +0 -36
  195. aiq/experimental/inference_time_scaling/scoring/__init__.py +0 -0
  196. aiq/experimental/inference_time_scaling/scoring/llm_based_agent_scorer.py +0 -168
  197. aiq/experimental/inference_time_scaling/scoring/llm_based_plan_scorer.py +0 -168
  198. aiq/experimental/inference_time_scaling/scoring/motivation_aware_scorer.py +0 -111
  199. aiq/experimental/inference_time_scaling/search/__init__.py +0 -0
  200. aiq/experimental/inference_time_scaling/search/multi_llm_planner.py +0 -128
  201. aiq/experimental/inference_time_scaling/search/multi_query_retrieval_search.py +0 -122
  202. aiq/experimental/inference_time_scaling/search/single_shot_multi_plan_planner.py +0 -128
  203. aiq/experimental/inference_time_scaling/selection/__init__.py +0 -0
  204. aiq/experimental/inference_time_scaling/selection/best_of_n_selector.py +0 -63
  205. aiq/experimental/inference_time_scaling/selection/llm_based_agent_output_selector.py +0 -131
  206. aiq/experimental/inference_time_scaling/selection/llm_based_output_merging_selector.py +0 -159
  207. aiq/experimental/inference_time_scaling/selection/llm_based_plan_selector.py +0 -128
  208. aiq/experimental/inference_time_scaling/selection/threshold_selector.py +0 -58
  209. aiq/front_ends/__init__.py +0 -14
  210. aiq/front_ends/console/__init__.py +0 -14
  211. aiq/front_ends/console/authentication_flow_handler.py +0 -233
  212. aiq/front_ends/console/console_front_end_config.py +0 -32
  213. aiq/front_ends/console/console_front_end_plugin.py +0 -96
  214. aiq/front_ends/console/register.py +0 -25
  215. aiq/front_ends/cron/__init__.py +0 -14
  216. aiq/front_ends/fastapi/__init__.py +0 -14
  217. aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
  218. aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +0 -27
  219. aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +0 -107
  220. aiq/front_ends/fastapi/fastapi_front_end_config.py +0 -234
  221. aiq/front_ends/fastapi/fastapi_front_end_controller.py +0 -68
  222. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +0 -116
  223. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +0 -1092
  224. aiq/front_ends/fastapi/html_snippets/__init__.py +0 -14
  225. aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +0 -35
  226. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +0 -80
  227. aiq/front_ends/fastapi/job_store.py +0 -183
  228. aiq/front_ends/fastapi/main.py +0 -72
  229. aiq/front_ends/fastapi/message_handler.py +0 -298
  230. aiq/front_ends/fastapi/message_validator.py +0 -345
  231. aiq/front_ends/fastapi/register.py +0 -25
  232. aiq/front_ends/fastapi/response_helpers.py +0 -195
  233. aiq/front_ends/fastapi/step_adaptor.py +0 -321
  234. aiq/front_ends/mcp/__init__.py +0 -14
  235. aiq/front_ends/mcp/mcp_front_end_config.py +0 -32
  236. aiq/front_ends/mcp/mcp_front_end_plugin.py +0 -93
  237. aiq/front_ends/mcp/register.py +0 -27
  238. aiq/front_ends/mcp/tool_converter.py +0 -242
  239. aiq/front_ends/register.py +0 -22
  240. aiq/front_ends/simple_base/__init__.py +0 -14
  241. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +0 -54
  242. aiq/llm/__init__.py +0 -0
  243. aiq/llm/aws_bedrock_llm.py +0 -57
  244. aiq/llm/nim_llm.py +0 -46
  245. aiq/llm/openai_llm.py +0 -46
  246. aiq/llm/register.py +0 -23
  247. aiq/llm/utils/__init__.py +0 -14
  248. aiq/llm/utils/env_config_value.py +0 -94
  249. aiq/llm/utils/error.py +0 -17
  250. aiq/memory/__init__.py +0 -20
  251. aiq/memory/interfaces.py +0 -183
  252. aiq/memory/models.py +0 -112
  253. aiq/meta/module_to_distro.json +0 -3
  254. aiq/meta/pypi.md +0 -58
  255. aiq/object_store/__init__.py +0 -20
  256. aiq/object_store/in_memory_object_store.py +0 -76
  257. aiq/object_store/interfaces.py +0 -84
  258. aiq/object_store/models.py +0 -36
  259. aiq/object_store/register.py +0 -20
  260. aiq/observability/__init__.py +0 -14
  261. aiq/observability/exporter/__init__.py +0 -14
  262. aiq/observability/exporter/base_exporter.py +0 -449
  263. aiq/observability/exporter/exporter.py +0 -78
  264. aiq/observability/exporter/file_exporter.py +0 -33
  265. aiq/observability/exporter/processing_exporter.py +0 -322
  266. aiq/observability/exporter/raw_exporter.py +0 -52
  267. aiq/observability/exporter/span_exporter.py +0 -265
  268. aiq/observability/exporter_manager.py +0 -335
  269. aiq/observability/mixin/__init__.py +0 -14
  270. aiq/observability/mixin/batch_config_mixin.py +0 -26
  271. aiq/observability/mixin/collector_config_mixin.py +0 -23
  272. aiq/observability/mixin/file_mixin.py +0 -288
  273. aiq/observability/mixin/file_mode.py +0 -23
  274. aiq/observability/mixin/resource_conflict_mixin.py +0 -134
  275. aiq/observability/mixin/serialize_mixin.py +0 -61
  276. aiq/observability/mixin/type_introspection_mixin.py +0 -183
  277. aiq/observability/processor/__init__.py +0 -14
  278. aiq/observability/processor/batching_processor.py +0 -309
  279. aiq/observability/processor/callback_processor.py +0 -42
  280. aiq/observability/processor/intermediate_step_serializer.py +0 -28
  281. aiq/observability/processor/processor.py +0 -71
  282. aiq/observability/register.py +0 -96
  283. aiq/observability/utils/__init__.py +0 -14
  284. aiq/observability/utils/dict_utils.py +0 -236
  285. aiq/observability/utils/time_utils.py +0 -31
  286. aiq/plugins/.namespace +0 -1
  287. aiq/profiler/__init__.py +0 -0
  288. aiq/profiler/calc/__init__.py +0 -14
  289. aiq/profiler/calc/calc_runner.py +0 -627
  290. aiq/profiler/calc/calculations.py +0 -288
  291. aiq/profiler/calc/data_models.py +0 -188
  292. aiq/profiler/calc/plot.py +0 -345
  293. aiq/profiler/callbacks/__init__.py +0 -0
  294. aiq/profiler/callbacks/agno_callback_handler.py +0 -295
  295. aiq/profiler/callbacks/base_callback_class.py +0 -20
  296. aiq/profiler/callbacks/langchain_callback_handler.py +0 -290
  297. aiq/profiler/callbacks/llama_index_callback_handler.py +0 -205
  298. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +0 -238
  299. aiq/profiler/callbacks/token_usage_base_model.py +0 -27
  300. aiq/profiler/data_frame_row.py +0 -51
  301. aiq/profiler/data_models.py +0 -24
  302. aiq/profiler/decorators/__init__.py +0 -0
  303. aiq/profiler/decorators/framework_wrapper.py +0 -131
  304. aiq/profiler/decorators/function_tracking.py +0 -254
  305. aiq/profiler/forecasting/__init__.py +0 -0
  306. aiq/profiler/forecasting/config.py +0 -18
  307. aiq/profiler/forecasting/model_trainer.py +0 -75
  308. aiq/profiler/forecasting/models/__init__.py +0 -22
  309. aiq/profiler/forecasting/models/forecasting_base_model.py +0 -40
  310. aiq/profiler/forecasting/models/linear_model.py +0 -196
  311. aiq/profiler/forecasting/models/random_forest_regressor.py +0 -268
  312. aiq/profiler/inference_metrics_model.py +0 -28
  313. aiq/profiler/inference_optimization/__init__.py +0 -0
  314. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  315. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +0 -460
  316. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +0 -258
  317. aiq/profiler/inference_optimization/data_models.py +0 -386
  318. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  319. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +0 -468
  320. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +0 -405
  321. aiq/profiler/inference_optimization/llm_metrics.py +0 -212
  322. aiq/profiler/inference_optimization/prompt_caching.py +0 -163
  323. aiq/profiler/inference_optimization/token_uniqueness.py +0 -107
  324. aiq/profiler/inference_optimization/workflow_runtimes.py +0 -72
  325. aiq/profiler/intermediate_property_adapter.py +0 -102
  326. aiq/profiler/profile_runner.py +0 -473
  327. aiq/profiler/utils.py +0 -184
  328. aiq/registry_handlers/__init__.py +0 -0
  329. aiq/registry_handlers/local/__init__.py +0 -0
  330. aiq/registry_handlers/local/local_handler.py +0 -176
  331. aiq/registry_handlers/local/register_local.py +0 -37
  332. aiq/registry_handlers/metadata_factory.py +0 -60
  333. aiq/registry_handlers/package_utils.py +0 -567
  334. aiq/registry_handlers/pypi/__init__.py +0 -0
  335. aiq/registry_handlers/pypi/pypi_handler.py +0 -251
  336. aiq/registry_handlers/pypi/register_pypi.py +0 -40
  337. aiq/registry_handlers/register.py +0 -21
  338. aiq/registry_handlers/registry_handler_base.py +0 -157
  339. aiq/registry_handlers/rest/__init__.py +0 -0
  340. aiq/registry_handlers/rest/register_rest.py +0 -56
  341. aiq/registry_handlers/rest/rest_handler.py +0 -237
  342. aiq/registry_handlers/schemas/__init__.py +0 -0
  343. aiq/registry_handlers/schemas/headers.py +0 -42
  344. aiq/registry_handlers/schemas/package.py +0 -68
  345. aiq/registry_handlers/schemas/publish.py +0 -63
  346. aiq/registry_handlers/schemas/pull.py +0 -82
  347. aiq/registry_handlers/schemas/remove.py +0 -36
  348. aiq/registry_handlers/schemas/search.py +0 -91
  349. aiq/registry_handlers/schemas/status.py +0 -47
  350. aiq/retriever/__init__.py +0 -0
  351. aiq/retriever/interface.py +0 -37
  352. aiq/retriever/milvus/__init__.py +0 -14
  353. aiq/retriever/milvus/register.py +0 -81
  354. aiq/retriever/milvus/retriever.py +0 -228
  355. aiq/retriever/models.py +0 -74
  356. aiq/retriever/nemo_retriever/__init__.py +0 -14
  357. aiq/retriever/nemo_retriever/register.py +0 -60
  358. aiq/retriever/nemo_retriever/retriever.py +0 -190
  359. aiq/retriever/register.py +0 -22
  360. aiq/runtime/__init__.py +0 -14
  361. aiq/runtime/loader.py +0 -215
  362. aiq/runtime/runner.py +0 -190
  363. aiq/runtime/session.py +0 -158
  364. aiq/runtime/user_metadata.py +0 -130
  365. aiq/settings/__init__.py +0 -0
  366. aiq/settings/global_settings.py +0 -318
  367. aiq/test/.namespace +0 -1
  368. aiq/tool/__init__.py +0 -0
  369. aiq/tool/chat_completion.py +0 -74
  370. aiq/tool/code_execution/README.md +0 -151
  371. aiq/tool/code_execution/__init__.py +0 -0
  372. aiq/tool/code_execution/code_sandbox.py +0 -267
  373. aiq/tool/code_execution/local_sandbox/.gitignore +0 -1
  374. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +0 -60
  375. aiq/tool/code_execution/local_sandbox/__init__.py +0 -13
  376. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +0 -198
  377. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +0 -6
  378. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +0 -50
  379. aiq/tool/code_execution/register.py +0 -74
  380. aiq/tool/code_execution/test_code_execution_sandbox.py +0 -414
  381. aiq/tool/code_execution/utils.py +0 -100
  382. aiq/tool/datetime_tools.py +0 -42
  383. aiq/tool/document_search.py +0 -141
  384. aiq/tool/github_tools/__init__.py +0 -0
  385. aiq/tool/github_tools/create_github_commit.py +0 -133
  386. aiq/tool/github_tools/create_github_issue.py +0 -87
  387. aiq/tool/github_tools/create_github_pr.py +0 -106
  388. aiq/tool/github_tools/get_github_file.py +0 -106
  389. aiq/tool/github_tools/get_github_issue.py +0 -166
  390. aiq/tool/github_tools/get_github_pr.py +0 -256
  391. aiq/tool/github_tools/update_github_issue.py +0 -100
  392. aiq/tool/mcp/__init__.py +0 -14
  393. aiq/tool/mcp/exceptions.py +0 -142
  394. aiq/tool/mcp/mcp_client.py +0 -255
  395. aiq/tool/mcp/mcp_tool.py +0 -96
  396. aiq/tool/memory_tools/__init__.py +0 -0
  397. aiq/tool/memory_tools/add_memory_tool.py +0 -79
  398. aiq/tool/memory_tools/delete_memory_tool.py +0 -67
  399. aiq/tool/memory_tools/get_memory_tool.py +0 -72
  400. aiq/tool/nvidia_rag.py +0 -95
  401. aiq/tool/register.py +0 -38
  402. aiq/tool/retriever.py +0 -89
  403. aiq/tool/server_tools.py +0 -66
  404. aiq/utils/__init__.py +0 -0
  405. aiq/utils/data_models/__init__.py +0 -0
  406. aiq/utils/data_models/schema_validator.py +0 -58
  407. aiq/utils/debugging_utils.py +0 -43
  408. aiq/utils/dump_distro_mapping.py +0 -32
  409. aiq/utils/exception_handlers/__init__.py +0 -0
  410. aiq/utils/exception_handlers/automatic_retries.py +0 -289
  411. aiq/utils/exception_handlers/mcp.py +0 -211
  412. aiq/utils/exception_handlers/schemas.py +0 -114
  413. aiq/utils/io/__init__.py +0 -0
  414. aiq/utils/io/model_processing.py +0 -28
  415. aiq/utils/io/yaml_tools.py +0 -119
  416. aiq/utils/log_utils.py +0 -37
  417. aiq/utils/metadata_utils.py +0 -74
  418. aiq/utils/optional_imports.py +0 -142
  419. aiq/utils/producer_consumer_queue.py +0 -178
  420. aiq/utils/reactive/__init__.py +0 -0
  421. aiq/utils/reactive/base/__init__.py +0 -0
  422. aiq/utils/reactive/base/observable_base.py +0 -65
  423. aiq/utils/reactive/base/observer_base.py +0 -55
  424. aiq/utils/reactive/base/subject_base.py +0 -79
  425. aiq/utils/reactive/observable.py +0 -59
  426. aiq/utils/reactive/observer.py +0 -76
  427. aiq/utils/reactive/subject.py +0 -131
  428. aiq/utils/reactive/subscription.py +0 -49
  429. aiq/utils/settings/__init__.py +0 -0
  430. aiq/utils/settings/global_settings.py +0 -197
  431. aiq/utils/string_utils.py +0 -38
  432. aiq/utils/type_converter.py +0 -290
  433. aiq/utils/type_utils.py +0 -484
  434. aiq/utils/url_utils.py +0 -27
  435. aiqtoolkit-1.2.0rc4.dist-info/METADATA +0 -363
  436. aiqtoolkit-1.2.0rc4.dist-info/RECORD +0 -438
  437. aiqtoolkit-1.2.0rc4.dist-info/entry_points.txt +0 -20
  438. aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE-3rd-party.txt +0 -3686
  439. aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE.md +0 -201
  440. aiqtoolkit-1.2.0rc4.dist-info/top_level.txt +0 -1
  441. {aiqtoolkit-1.2.0rc4.dist-info → aiqtoolkit-1.2rc9.dist-info}/WHEEL +0 -0
aiq/profiler/calc/plot.py DELETED
@@ -1,345 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import logging
17
- from pathlib import Path
18
-
19
- import matplotlib.pyplot as plt
20
- import numpy as np
21
- import pandas as pd
22
-
23
- from aiq.profiler.calc.data_models import LinearFitResult
24
- from aiq.profiler.calc.data_models import SizingMetrics
25
-
26
- logger = logging.getLogger(__name__)
27
-
28
-
29
- # Plotting constants
30
class PlotConfig:
    """Styling constants used by the plotting helpers in this module.

    The class is never instantiated; it only groups the values so call sites
    can refer to them as ``PlotConfig.<NAME>``.
    """

    # --- Figure geometry and output resolution ---
    SIMPLE_FIGSIZE = (12, 6)
    SIMPLE_DPI = 150
    SIMPLE_LINEWIDTH = 2
    ENHANCED_FIGSIZE = (16, 6)
    ENHANCED_DPI = 300

    # --- Regular data points ---
    DATA_MARKER = "o"
    DATA_ALPHA = 0.7
    DATA_POINT_SIZE = 120
    DATA_LINEWIDTH = 1

    # --- Points that were removed as outliers ---
    OUTLIER_MARKER = "x"
    OUTLIER_COLOR = "crimson"
    OUTLIER_ALPHA = 0.9
    OUTLIER_POINT_SIZE = 140

    # --- Trend (linear fit) line ---
    TREND_COLOR = "r"
    TREND_LINESTYLE = "--"
    TREND_ALPHA = 0.8
    TREND_LINEWIDTH = 2.0
    TREND_LINE_POINTS = 100

    # --- Per-metric and SLA colours ---
    LLM_LATENCY_COLOR = "steelblue"
    RUNTIME_COLOR = "darkgreen"
    SLA_COLOR = "red"
    SLA_ALPHA = 0.7

    # --- Grid ---
    GRID_ALPHA = 0.3

    # --- Outlier note box ---
    NOTE_BOX_COLOR = "mistyrose"
    NOTE_TEXT_COLOR = "crimson"
    NOTE_BOX_ALPHA = 0.7
    NOTE_BOX_PAD = 0.3
    NOTE_FONTSIZE = 10
    NOTE_X_POS = 0.98
    NOTE_Y_POS = 0.02

    # --- Statistics box ---
    STATS_BOX_COLOR = "lightblue"
    STATS_BOX_ALPHA = 0.8
    STATS_BOX_PAD = 0.5
    STATS_FONTSIZE = 10
    STATS_X_POS = 0.02
    STATS_Y_POS = 0.02

    # --- Axis labels, title and legend typography ---
    AXIS_LABEL_FONTSIZE = 12
    AXIS_LABEL_FONTWEIGHT = "bold"
    TITLE_FONTSIZE = 14
    TITLE_FONTWEIGHT = "bold"
    LEGEND_FONTSIZE = 10
94
-
95
def plot_concurrency_vs_time_metrics_simple(df: pd.DataFrame, output_dir: Path) -> None:
    """
    Save a simple plot of concurrency vs. p95 LLM latency and workflow runtime.

    Args:
        df: Table providing the ``concurrency``, ``llm_latency_p95`` and
            ``workflow_runtime_p95`` columns that are plotted.
        output_dir: Directory that receives ``concurrency_vs_p95_simple.png``.
    """
    # Work on an explicit Figure/Axes pair instead of pyplot's implicit
    # "current figure", so this function cannot draw onto (or close) a figure
    # owned by someone else.
    fig, ax = plt.subplots(figsize=PlotConfig.SIMPLE_FIGSIZE)
    try:
        ax.plot(df["concurrency"],
                df["llm_latency_p95"],
                label="p95 LLM Latency (s)",
                marker=PlotConfig.DATA_MARKER,
                linewidth=PlotConfig.SIMPLE_LINEWIDTH)
        ax.plot(df["concurrency"],
                df["workflow_runtime_p95"],
                label="p95 Workflow Runtime (s)",
                marker="s",
                linewidth=PlotConfig.SIMPLE_LINEWIDTH)
        ax.set_xlabel("Concurrency")
        ax.set_ylabel("Time (seconds)")
        ax.set_title("Concurrency vs. p95 LLM Latency and Workflow Runtime")
        ax.grid(True, alpha=PlotConfig.GRID_ALPHA)
        ax.legend()
        fig.tight_layout()

        simple_plot_path = output_dir / "concurrency_vs_p95_simple.png"
        fig.savefig(simple_plot_path, dpi=PlotConfig.SIMPLE_DPI, bbox_inches='tight')
    finally:
        # Release the figure even when plotting or saving fails; pyplot keeps
        # every unclosed figure alive otherwise.
        plt.close(fig)

    logger.info("Simple plot saved to %s", simple_plot_path)
121
-
122
-
123
def plot_metric_vs_concurrency_with_optional_fit(
    ax: plt.Axes,
    x: np.ndarray,
    y: np.ndarray,
    metric_name: str,
    y_label: str,
    title: str,
    color: str,
    sla_value: float = 0.0,
    sla_label: str | None = None,
    fit: LinearFitResult | None = None,
) -> bool:
    """
    Helper to plot a metric vs concurrency with pre-computed fit, outlier highlighting, and SLA line.
    Requires pre-computed fit to be provided.

    Args:
        ax: Axes to draw on.
        x: Concurrency values.
        y: Metric values, aligned element-wise with ``x``.
        metric_name: Metric identifier, used only in log messages.
        y_label: Label for the y axis.
        title: Axes title.
        color: Colour of the regular data points.
        sla_value: SLA threshold; a horizontal line is drawn only when it is > 0.
        sla_label: Legend label for the SLA line; a default label is built from
            ``sla_value`` when omitted or empty.
        fit: Pre-computed linear fit. Its ``slope``, ``intercept``, ``r_squared``
            and ``outliers_removed`` attributes are read.

    Returns:
        True if the plot was drawn, False if it was skipped because no fit or
        no data points were available.
    """
    # Skip analysis plot if no fit is available
    if not fit:
        logger.warning("No linear fit available for %s, skipping analysis plot", metric_name)
        return False

    # The trend line spans x.min()..x.max(), which raises on an empty array.
    if x.size == 0:
        logger.warning("No data points available for %s, skipping analysis plot", metric_name)
        return False

    # Styling shared by the "Data Points" scatter in both branches below.
    data_style = dict(alpha=PlotConfig.DATA_ALPHA,
                      s=PlotConfig.DATA_POINT_SIZE,
                      c=color,
                      edgecolors='white',
                      linewidth=PlotConfig.DATA_LINEWIDTH,
                      marker=PlotConfig.DATA_MARKER,
                      label='Data Points')

    outliers_note = ""
    if fit.outliers_removed:
        # Use the concurrencies that were removed to identify outlier points;
        # the mask is computed once and inverted for the retained points.
        outlier_mask = np.isin(x, fit.outliers_removed)
        keep_mask = ~outlier_mask
        outliers_note = f"Outliers removed: concurrencies {fit.outliers_removed}"
        ax.scatter(x[keep_mask], y[keep_mask], **data_style)
        ax.scatter(x[outlier_mask],
                   y[outlier_mask],
                   alpha=PlotConfig.OUTLIER_ALPHA,
                   s=PlotConfig.OUTLIER_POINT_SIZE,
                   c=PlotConfig.OUTLIER_COLOR,
                   marker=PlotConfig.OUTLIER_MARKER,
                   label='Removed Outliers')
    else:
        # No outliers were removed, so plot all data points.
        ax.scatter(x, y, **data_style)

    # Plot trend line using the fit
    x_fit = np.linspace(x.min(), x.max(), PlotConfig.TREND_LINE_POINTS)
    y_fit = fit.slope * x_fit + fit.intercept
    ax.plot(x_fit,
            y_fit,
            PlotConfig.TREND_LINESTYLE,
            alpha=PlotConfig.TREND_ALPHA,
            linewidth=PlotConfig.TREND_LINEWIDTH,
            color=PlotConfig.TREND_COLOR,
            label=f'Trend (slope={fit.slope:.4f}, R²={fit.r_squared:.3f})')

    if sla_value > 0:
        ax.axhline(y=sla_value,
                   color=PlotConfig.SLA_COLOR,
                   linestyle=':',
                   alpha=PlotConfig.SLA_ALPHA,
                   linewidth=2,
                   label=sla_label or f'SLA Threshold ({sla_value}s)')

    ax.set_xlabel('Concurrency', fontsize=PlotConfig.AXIS_LABEL_FONTSIZE, fontweight=PlotConfig.AXIS_LABEL_FONTWEIGHT)
    ax.set_ylabel(y_label, fontsize=PlotConfig.AXIS_LABEL_FONTSIZE, fontweight=PlotConfig.AXIS_LABEL_FONTWEIGHT)
    ax.set_title(title, fontsize=PlotConfig.TITLE_FONTSIZE, fontweight=PlotConfig.TITLE_FONTWEIGHT)
    ax.grid(True, alpha=PlotConfig.GRID_ALPHA)
    ax.legend(fontsize=PlotConfig.LEGEND_FONTSIZE)

    if outliers_note:
        # Anchor the note in the bottom-right corner, in axes-relative coordinates.
        ax.text(PlotConfig.NOTE_X_POS,
                PlotConfig.NOTE_Y_POS,
                outliers_note,
                transform=ax.transAxes,
                fontsize=PlotConfig.NOTE_FONTSIZE,
                color=PlotConfig.NOTE_TEXT_COLOR,
                ha='right',
                va='bottom',
                bbox=dict(boxstyle=f'round,pad={PlotConfig.NOTE_BOX_PAD}',
                          facecolor=PlotConfig.NOTE_BOX_COLOR,
                          alpha=PlotConfig.NOTE_BOX_ALPHA))

    return True
233
-
234
-
235
def plot_concurrency_vs_time_metrics(metrics_per_concurrency: dict[int, SizingMetrics],
                                     output_dir: Path,
                                     target_llm_latency: float = 0.0,
                                     target_runtime: float = 0.0,
                                     llm_latency_fit: LinearFitResult | None = None,
                                     runtime_fit: LinearFitResult | None = None) -> None:
    """
    Plot concurrency vs. p95 LLM latency and p95 workflow runtime.

    A simple plot is always produced first via ``plot_concurrency_vs_time_metrics_simple``.
    An additional "analysis" figure is written to ``output_dir / "concurrency_vs_p95_analysis.png"``
    when at least one pre-computed linear fit is supplied. One subplot is drawn per available fit.

    Args:
        metrics_per_concurrency: Mapping of concurrency level to its sizing metrics; the
            ``llm_latency_p95`` and ``workflow_runtime_p95`` attributes are read from each entry.
        output_dir: Directory the analysis figure is saved into (created if missing).
        target_llm_latency: SLA threshold for LLM latency; passed to the metric plot as ``sla_value``
            and only labelled when greater than zero.
        target_runtime: SLA threshold for workflow runtime; handled like ``target_llm_latency``.
        llm_latency_fit: Pre-computed fit for the LLM latency series, or ``None`` to skip that subplot.
        runtime_fit: Pre-computed fit for the workflow runtime series, or ``None`` to skip that subplot.
    """
    rows = [{
        "concurrency": concurrency,
        "llm_latency_p95": metrics.llm_latency_p95,
        "workflow_runtime_p95": metrics.workflow_runtime_p95,
    } for concurrency, metrics in metrics_per_concurrency.items()]

    if not rows:
        logger.warning("No valid metrics data available to plot.")
        return

    plt.style.use('seaborn-v0_8')
    df = pd.DataFrame(rows).sort_values("concurrency")

    # Always generate simple plot first
    plot_concurrency_vs_time_metrics_simple(df, output_dir)

    # Check if we have fits available for analysis plots
    has_llm_latency_fit = llm_latency_fit is not None
    has_runtime_fit = runtime_fit is not None

    if not has_llm_latency_fit and not has_runtime_fit:
        logger.warning("No linear fits available for analysis plots, skipping enhanced plot")
        return

    # Create subplots based on available fits. With a single fit, the lone axis is handed to
    # whichever metric actually has a fit, so a runtime-only fit is plotted rather than dropped.
    if has_llm_latency_fit and has_runtime_fit:
        fig, (llm_latency_ax, runtime_ax) = plt.subplots(1, 2, figsize=PlotConfig.ENHANCED_FIGSIZE)
    else:
        fig, single_ax = plt.subplots(1, 1, figsize=(8, 6))
        llm_latency_ax = single_ax if has_llm_latency_fit else None
        runtime_ax = single_ax if has_runtime_fit else None

    concurrency_values = df["concurrency"].to_numpy()

    # Plot llm_latency if fit is available
    llm_latency_plotted = False
    if llm_latency_ax is not None:
        llm_latency_plotted = plot_metric_vs_concurrency_with_optional_fit(
            llm_latency_ax,
            concurrency_values,
            df["llm_latency_p95"].to_numpy(),
            metric_name="llm_latency",
            y_label='P95 LLM Latency (seconds)',
            title='Concurrency vs P95 LLM Latency',
            color=PlotConfig.LLM_LATENCY_COLOR,
            sla_value=target_llm_latency,
            sla_label=f'SLA Threshold ({target_llm_latency}s)' if target_llm_latency > 0 else None,
            fit=llm_latency_fit,
        )

    # Plot runtime if fit is available
    runtime_plotted = False
    if runtime_ax is not None:
        runtime_plotted = plot_metric_vs_concurrency_with_optional_fit(
            runtime_ax,
            concurrency_values,
            df["workflow_runtime_p95"].to_numpy(),
            metric_name="runtime",
            y_label='P95 Workflow Runtime (seconds)',
            title='Concurrency vs P95 Workflow Runtime',
            color=PlotConfig.RUNTIME_COLOR,
            sla_value=target_runtime,
            sla_label=f'SLA Threshold ({target_runtime}s)' if target_runtime > 0 else None,
            fit=runtime_fit,
        )

    # Check if any plots were successfully created
    if not (llm_latency_plotted or runtime_plotted):
        logger.warning("No analysis plots could be created, skipping enhanced plot")
        plt.close(fig)
        return

    # Add summary statistics
    stats_text = f'Data Points: {len(df)}\n'
    stats_text += f'LLM Latency Range: {df["llm_latency_p95"].min():.3f}-{df["llm_latency_p95"].max():.3f}s\n'
    stats_text += f'WF Runtime Range: {df["workflow_runtime_p95"].min():.3f}-{df["workflow_runtime_p95"].max():.3f}s'

    fig.text(PlotConfig.STATS_X_POS,
             PlotConfig.STATS_Y_POS,
             stats_text,
             fontsize=PlotConfig.STATS_FONTSIZE,
             bbox=dict(boxstyle=f'round,pad={PlotConfig.STATS_BOX_PAD}',
                       facecolor=PlotConfig.STATS_BOX_COLOR,
                       alpha=PlotConfig.STATS_BOX_ALPHA))

    fig.tight_layout()
    output_dir.mkdir(parents=True, exist_ok=True)

    enhanced_plot_path = output_dir / "concurrency_vs_p95_analysis.png"
    # Save and close this specific figure instead of relying on pyplot's "current figure" state.
    fig.savefig(enhanced_plot_path,
                dpi=PlotConfig.ENHANCED_DPI,
                bbox_inches='tight',
                facecolor='white',
                edgecolor='none')
    plt.close(fig)

    logger.info("Enhanced plot saved to %s", enhanced_plot_path)
File without changes
@@ -1,295 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import copy
17
- import logging
18
- import threading
19
- import time
20
- from collections.abc import Callable
21
- from typing import Any
22
- from uuid import uuid4
23
-
24
- import litellm
25
-
26
- from aiq.builder.context import AIQContext
27
- from aiq.builder.framework_enum import LLMFrameworkEnum
28
- from aiq.data_models.intermediate_step import IntermediateStepPayload
29
- from aiq.data_models.intermediate_step import IntermediateStepType
30
- from aiq.data_models.intermediate_step import StreamEventData
31
- from aiq.data_models.intermediate_step import TraceMetadata
32
- from aiq.data_models.intermediate_step import UsageInfo
33
- from aiq.profiler.callbacks.base_callback_class import BaseProfilerCallback
34
- from aiq.profiler.callbacks.token_usage_base_model import TokenUsageBaseModel
35
-
36
- logger = logging.getLogger(__name__)
37
-
38
-
39
class AgnoProfilerHandler(BaseProfilerCallback):
    """
    A callback manager/handler for Agno that intercepts calls to:

    - Tool execution
    - LLM Calls

    to collect usage statistics (tokens, inputs, outputs, time intervals, etc.)
    and store them in AIQ Toolkit's usage_stats queue for subsequent analysis.
    """

    def __init__(self) -> None:
        """Capture the current context's intermediate step manager and reset the call timestamp."""
        super().__init__()
        self._lock = threading.Lock()
        self.last_call_ts = time.time()
        self.step_manager = AIQContext.get().intermediate_step_manager

        # Original references to Agno methods (for uninstrumenting if needed)
        self._original_tool_execute = None
        self._original_llm_call = None

    def instrument(self) -> None:
        """
        Monkey-patch the relevant Agno methods with usage-stat collection logic.

        Only ``litellm.completion`` is patched; see the notes in the body about tool execution.
        """
        # Save the originals and apply patches
        self._original_llm_call = getattr(litellm, "completion", None)

        # Patch LLM completion if available
        if self._original_llm_call:
            litellm.completion = self._llm_call_monkey_patch()
            logger.debug("AgnoProfilerHandler LLM call instrumentation applied successfully.")
        else:
            logger.debug("Could not patch Agno LLM calls: litellm.completion not found")

        # Note: Agno doesn't have a class-based tool structure to patch directly.
        # Instead, it uses decorators to convert functions to tools.
        # In AIQ Toolkit, tool executions are captured at the execute_agno_tool level
        # in packages/aiqtoolkit_agno/src/aiq/plugins/agno/tool_wrapper.py

        # To properly monitor Agno tool executions, we would need to either:
        # 1. Patch the execute_agno_tool function in tool_wrapper.py
        # 2. Add explicit instrumentation in that function to push events to the step manager
        # 3. Or, if Agno updates to have a class-based tool structure, update this handler
        #    to patch those classes

        # Recommended future enhancement:
        # The execute_agno_tool function in packages/aiqtoolkit_agno/src/aiq/plugins/agno/tool_wrapper.py
        # should be updated to directly push IntermediateStepPayload events to the step manager
        # at the beginning and end of tool execution, similar to what this handler does for LLM calls.

        logger.debug("AgnoProfilerHandler instrumentation completed.")

    def _tool_execute_monkey_patch(self) -> Callable[..., Any]:
        """
        Returns a function that wraps tool execution calls with usage-logging.

        Note: This method is currently not used in the instrument() function since
        Agno doesn't have a class-based tool structure to patch. It's kept for
        reference or future use if Agno changes its architecture.
        """
        original_func = self._original_tool_execute

        def wrapped_tool_execute(*args, **kwargs) -> Any:
            """
            Collects usage stats for tool execution, calls the original, and captures output stats.
            """
            now = time.time()
            tool_name = kwargs.get("tool_name", "")
            uuid = str(uuid4())

            try:
                # Pre-call usage event
                stats = IntermediateStepPayload(event_type=IntermediateStepType.TOOL_START,
                                                framework=LLMFrameworkEnum.AGNO,
                                                name=tool_name,
                                                UUID=uuid,
                                                data=StreamEventData(),
                                                metadata=TraceMetadata(tool_inputs={
                                                    "args": args, "kwargs": dict(kwargs)
                                                }),
                                                usage_info=UsageInfo(token_usage=TokenUsageBaseModel()))

                self.step_manager.push_intermediate_step(stats)
                self.last_call_ts = now

                # Call the original execute
                result = original_func(*args, **kwargs)
                now = time.time()

                # Post-call usage stats
                usage_stat = IntermediateStepPayload(
                    event_type=IntermediateStepType.TOOL_END,
                    span_event_timestamp=now,
                    framework=LLMFrameworkEnum.AGNO,
                    name=tool_name,
                    UUID=uuid,
                    data=StreamEventData(input={
                        "args": args, "kwargs": dict(kwargs)
                    }, output=str(result)),
                    metadata=TraceMetadata(tool_outputs={"result": str(result)}),
                    usage_info=UsageInfo(token_usage=TokenUsageBaseModel()),
                )

                self.step_manager.push_intermediate_step(usage_stat)
                return result

            except Exception as e:
                logger.exception("Tool execution error: %s", e)
                raise

        return wrapped_tool_execute

    @staticmethod
    def _content_to_text(content: Any) -> str:
        """Flatten a message ``content`` value (None, str, or a list of parts) into plain text."""
        if content is None:
            return ""
        if isinstance(content, str):
            return content
        if isinstance(content, list):
            # Multi-part content: keep only the textual pieces.
            texts = []
            for part in content:
                if isinstance(part, str):
                    texts.append(part)
                elif isinstance(part, dict) and isinstance(part.get("text"), str):
                    texts.append(part["text"])
            return "".join(texts)
        return str(content)

    @staticmethod
    def _resolve_call_arguments(args: tuple, kwargs: dict) -> tuple[str, Any]:
        """Return ``(model_name, messages)`` from keyword arguments, falling back to positional ones."""
        model_name = kwargs.get('model', "")
        # litellm.completion takes (model, messages, ...) positionally as well.
        if not model_name and args and isinstance(args[0], str):
            model_name = args[0]

        if 'messages' in kwargs:
            messages = kwargs['messages']
        elif len(args) > 1:
            messages = args[1]
        else:
            messages = []
        return model_name, messages

    @staticmethod
    def _extract_model_input(messages: Any) -> str:
        """Concatenate the textual content of every chat message into one string."""
        pieces = []
        for message in messages or []:
            if isinstance(message, dict):
                raw_content = message.get('content')
            else:
                raw_content = getattr(message, 'content', None)
            pieces.append(AgnoProfilerHandler._content_to_text(raw_content))
        return "".join(pieces)

    @staticmethod
    def _extract_model_output(output: Any) -> tuple[str, Any]:
        """Return ``(concatenated choice text, chat_responses)`` for a completion result."""
        choices = getattr(output, 'choices', None)
        if not choices:
            return "", None

        logger.debug("Output has %s choices", len(choices))
        pieces = []
        for i, choice in enumerate(choices):
            logger.debug("Processing choice %s of type %s", i, type(choice))
            # model_extra can legitimately be None; only treat it as a mapping when it is one.
            extra = getattr(choice, 'model_extra', None)
            if isinstance(extra, dict) and 'message' in extra:
                msg = extra["message"]
                raw_content = msg.get('content') if isinstance(msg, dict) else getattr(msg, 'content', None)
                content = AgnoProfilerHandler._content_to_text(raw_content)
                logger.debug("Got content from model_extra.message: %s...", content[:50])
                pieces.append(content)
            elif hasattr(choice, 'message') and hasattr(choice.message, 'content'):
                content = AgnoProfilerHandler._content_to_text(choice.message.content)
                logger.debug("Got content from message.content: %s...", content[:50])
                pieces.append(content)
            else:
                logger.debug("Could not extract content from choice: %s", choice)

        model_output = "".join(pieces)

        # Try to get chat responses
        first_choice = choices[0]
        if hasattr(first_choice, 'model_dump'):
            logger.debug("Using model_dump to extract chat responses")
            chat_responses = first_choice.model_dump()
        else:
            # Fall back to a simpler representation
            logger.debug("Falling back to simple representation for chat responses")
            chat_responses = {"content": model_output}

        return model_output, chat_responses

    @staticmethod
    def _extract_token_usage(output: Any) -> TokenUsageBaseModel:
        """Build a ``TokenUsageBaseModel`` from ``output.model_extra['usage']``, or an empty one."""
        extra = getattr(output, 'model_extra', None)
        if not isinstance(extra, dict) or 'usage' not in extra:
            return TokenUsageBaseModel()

        usage_data = extra['usage']
        logger.debug("Found usage data of type %s", type(usage_data))

        # Checked first: a TokenUsageBaseModel also has model_dump, so this branch would
        # otherwise never be reached.
        if isinstance(usage_data, TokenUsageBaseModel):
            logger.debug("Using TokenUsageBaseModel directly")
            return usage_data
        if hasattr(usage_data, 'model_dump'):
            logger.debug("Using model_dump to extract token usage")
            return TokenUsageBaseModel(**usage_data.model_dump())
        if isinstance(usage_data, dict):
            logger.debug("Extracting token usage from dictionary")
            return TokenUsageBaseModel(prompt_tokens=usage_data.get('prompt_tokens', 0),
                                       completion_tokens=usage_data.get('completion_tokens', 0),
                                       total_tokens=usage_data.get('total_tokens', 0))
        if all(hasattr(usage_data, attr) for attr in ('prompt_tokens', 'completion_tokens', 'total_tokens')):
            # For objects that have the needed properties but aren't TokenUsageBaseModel
            logger.debug("Using object with token properties")
            return TokenUsageBaseModel(prompt_tokens=usage_data.prompt_tokens,
                                       completion_tokens=usage_data.completion_tokens,
                                       total_tokens=usage_data.total_tokens)
        return TokenUsageBaseModel()

    def _llm_call_monkey_patch(self) -> Callable[..., Any]:
        """
        Returns a function that wraps calls to litellm.completion(...) with usage-logging.
        """
        original_func = self._original_llm_call

        def wrapped_llm_call(*args, **kwargs) -> Any:
            """
            Collects usage stats for LLM calls, calls the original, and captures output stats.
            """
            now = time.time()
            seconds_between_calls = int(now - self.last_call_ts)
            # Record this call's start (as the tool wrapper does) so the next call measures the
            # gap since this one rather than since the handler was constructed.
            self.last_call_ts = now

            model_name, messages = self._resolve_call_arguments(args, kwargs)

            try:
                model_input = self._extract_model_input(messages)
            except Exception as e:
                logger.exception("Error getting model input: %s", e)
                model_input = ""

            uuid = str(uuid4())

            # Record the start event
            input_stats = IntermediateStepPayload(
                event_type=IntermediateStepType.LLM_START,
                framework=LLMFrameworkEnum.AGNO,
                name=model_name,
                UUID=uuid,
                data=StreamEventData(input=model_input),
                metadata=TraceMetadata(chat_inputs=copy.deepcopy(messages)),
                usage_info=UsageInfo(token_usage=TokenUsageBaseModel(),
                                     num_llm_calls=1,
                                     seconds_between_calls=seconds_between_calls))

            self.step_manager.push_intermediate_step(input_stats)

            # Verify we have a valid original function before calling it
            if original_func is None:
                logger.error("Original litellm.completion function is None - cannot call it")
                output = None
            else:
                # Call the original litellm.completion(...)
                logger.debug("Calling litellm.completion for %s with %s args and %s kwargs",
                             model_name,
                             len(args),
                             len(kwargs))
                try:
                    output = original_func(*args, **kwargs)
                    logger.debug("Original litellm.completion returned: %s", type(output))
                except Exception as e:
                    # NOTE(review): the failure is logged and converted into a None result, so the
                    # caller never sees the exception. Kept as-is; confirm this is intended.
                    logger.exception("Error calling original litellm.completion: %s", e)
                    output = None

            # Initialize default values
            model_output = ""
            chat_responses = None
            token_usage = TokenUsageBaseModel()

            # Log what we received to help with debugging
            logger.debug("LLM call to %s received output type: %s", model_name, type(output))

            # Safely process the output if it's not None
            if output is not None:
                try:
                    model_output, chat_responses = self._extract_model_output(output)
                    token_usage = self._extract_token_usage(output)
                    logger.debug("Final token usage: prompt=%s, completion=%s, total=%s",
                                 token_usage.prompt_tokens,
                                 token_usage.completion_tokens,
                                 token_usage.total_tokens)
                except Exception as e:
                    logger.exception("Error getting model output: %s", e)

            now = time.time()
            # Record the end event
            output_stats = IntermediateStepPayload(event_type=IntermediateStepType.LLM_END,
                                                   span_event_timestamp=now,
                                                   framework=LLMFrameworkEnum.AGNO,
                                                   name=model_name,
                                                   UUID=uuid,
                                                   data=StreamEventData(input=model_input, output=model_output),
                                                   metadata=TraceMetadata(chat_responses=chat_responses),
                                                   usage_info=UsageInfo(token_usage=token_usage,
                                                                        num_llm_calls=1,
                                                                        seconds_between_calls=seconds_between_calls))

            self.step_manager.push_intermediate_step(output_stats)
            return output

        return wrapped_llm_call
@@ -1,20 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- from abc import ABC
17
-
18
-
19
class BaseProfilerCallback(ABC):
    """Marker base class for profiler callbacks; it declares no attributes or methods of its own."""