aiqtoolkit 1.2.0rc4__py3-none-any.whl → 1.2.0rc5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of aiqtoolkit might be problematic. Click here for more details.

Files changed (441)
  1. aiqtoolkit-1.2.0rc5.dist-info/METADATA +29 -0
  2. aiqtoolkit-1.2.0rc5.dist-info/RECORD +4 -0
  3. aiqtoolkit-1.2.0rc5.dist-info/top_level.txt +1 -0
  4. aiq/agent/__init__.py +0 -0
  5. aiq/agent/base.py +0 -239
  6. aiq/agent/dual_node.py +0 -67
  7. aiq/agent/react_agent/__init__.py +0 -0
  8. aiq/agent/react_agent/agent.py +0 -355
  9. aiq/agent/react_agent/output_parser.py +0 -104
  10. aiq/agent/react_agent/prompt.py +0 -41
  11. aiq/agent/react_agent/register.py +0 -149
  12. aiq/agent/reasoning_agent/__init__.py +0 -0
  13. aiq/agent/reasoning_agent/reasoning_agent.py +0 -225
  14. aiq/agent/register.py +0 -23
  15. aiq/agent/rewoo_agent/__init__.py +0 -0
  16. aiq/agent/rewoo_agent/agent.py +0 -411
  17. aiq/agent/rewoo_agent/prompt.py +0 -108
  18. aiq/agent/rewoo_agent/register.py +0 -158
  19. aiq/agent/tool_calling_agent/__init__.py +0 -0
  20. aiq/agent/tool_calling_agent/agent.py +0 -119
  21. aiq/agent/tool_calling_agent/register.py +0 -106
  22. aiq/authentication/__init__.py +0 -14
  23. aiq/authentication/api_key/__init__.py +0 -14
  24. aiq/authentication/api_key/api_key_auth_provider.py +0 -96
  25. aiq/authentication/api_key/api_key_auth_provider_config.py +0 -124
  26. aiq/authentication/api_key/register.py +0 -26
  27. aiq/authentication/exceptions/__init__.py +0 -14
  28. aiq/authentication/exceptions/api_key_exceptions.py +0 -38
  29. aiq/authentication/exceptions/auth_code_grant_exceptions.py +0 -86
  30. aiq/authentication/exceptions/call_back_exceptions.py +0 -38
  31. aiq/authentication/exceptions/request_exceptions.py +0 -54
  32. aiq/authentication/http_basic_auth/__init__.py +0 -0
  33. aiq/authentication/http_basic_auth/http_basic_auth_provider.py +0 -81
  34. aiq/authentication/http_basic_auth/register.py +0 -30
  35. aiq/authentication/interfaces.py +0 -93
  36. aiq/authentication/oauth2/__init__.py +0 -14
  37. aiq/authentication/oauth2/oauth2_auth_code_flow_provider.py +0 -107
  38. aiq/authentication/oauth2/oauth2_auth_code_flow_provider_config.py +0 -39
  39. aiq/authentication/oauth2/register.py +0 -25
  40. aiq/authentication/register.py +0 -21
  41. aiq/builder/__init__.py +0 -0
  42. aiq/builder/builder.py +0 -285
  43. aiq/builder/component_utils.py +0 -316
  44. aiq/builder/context.py +0 -264
  45. aiq/builder/embedder.py +0 -24
  46. aiq/builder/eval_builder.py +0 -161
  47. aiq/builder/evaluator.py +0 -29
  48. aiq/builder/framework_enum.py +0 -24
  49. aiq/builder/front_end.py +0 -73
  50. aiq/builder/function.py +0 -344
  51. aiq/builder/function_base.py +0 -380
  52. aiq/builder/function_info.py +0 -627
  53. aiq/builder/intermediate_step_manager.py +0 -174
  54. aiq/builder/llm.py +0 -25
  55. aiq/builder/retriever.py +0 -25
  56. aiq/builder/user_interaction_manager.py +0 -74
  57. aiq/builder/workflow.py +0 -148
  58. aiq/builder/workflow_builder.py +0 -1117
  59. aiq/cli/__init__.py +0 -14
  60. aiq/cli/cli_utils/__init__.py +0 -0
  61. aiq/cli/cli_utils/config_override.py +0 -231
  62. aiq/cli/cli_utils/validation.py +0 -37
  63. aiq/cli/commands/__init__.py +0 -0
  64. aiq/cli/commands/configure/__init__.py +0 -0
  65. aiq/cli/commands/configure/channel/__init__.py +0 -0
  66. aiq/cli/commands/configure/channel/add.py +0 -28
  67. aiq/cli/commands/configure/channel/channel.py +0 -36
  68. aiq/cli/commands/configure/channel/remove.py +0 -30
  69. aiq/cli/commands/configure/channel/update.py +0 -30
  70. aiq/cli/commands/configure/configure.py +0 -33
  71. aiq/cli/commands/evaluate.py +0 -139
  72. aiq/cli/commands/info/__init__.py +0 -14
  73. aiq/cli/commands/info/info.py +0 -39
  74. aiq/cli/commands/info/list_channels.py +0 -32
  75. aiq/cli/commands/info/list_components.py +0 -129
  76. aiq/cli/commands/info/list_mcp.py +0 -213
  77. aiq/cli/commands/registry/__init__.py +0 -14
  78. aiq/cli/commands/registry/publish.py +0 -88
  79. aiq/cli/commands/registry/pull.py +0 -118
  80. aiq/cli/commands/registry/registry.py +0 -38
  81. aiq/cli/commands/registry/remove.py +0 -108
  82. aiq/cli/commands/registry/search.py +0 -155
  83. aiq/cli/commands/sizing/__init__.py +0 -14
  84. aiq/cli/commands/sizing/calc.py +0 -297
  85. aiq/cli/commands/sizing/sizing.py +0 -27
  86. aiq/cli/commands/start.py +0 -246
  87. aiq/cli/commands/uninstall.py +0 -81
  88. aiq/cli/commands/validate.py +0 -47
  89. aiq/cli/commands/workflow/__init__.py +0 -14
  90. aiq/cli/commands/workflow/templates/__init__.py.j2 +0 -0
  91. aiq/cli/commands/workflow/templates/config.yml.j2 +0 -16
  92. aiq/cli/commands/workflow/templates/pyproject.toml.j2 +0 -22
  93. aiq/cli/commands/workflow/templates/register.py.j2 +0 -5
  94. aiq/cli/commands/workflow/templates/workflow.py.j2 +0 -36
  95. aiq/cli/commands/workflow/workflow.py +0 -37
  96. aiq/cli/commands/workflow/workflow_commands.py +0 -313
  97. aiq/cli/entrypoint.py +0 -135
  98. aiq/cli/main.py +0 -44
  99. aiq/cli/register_workflow.py +0 -488
  100. aiq/cli/type_registry.py +0 -1000
  101. aiq/data_models/__init__.py +0 -14
  102. aiq/data_models/api_server.py +0 -694
  103. aiq/data_models/authentication.py +0 -231
  104. aiq/data_models/common.py +0 -171
  105. aiq/data_models/component.py +0 -54
  106. aiq/data_models/component_ref.py +0 -168
  107. aiq/data_models/config.py +0 -406
  108. aiq/data_models/dataset_handler.py +0 -123
  109. aiq/data_models/discovery_metadata.py +0 -335
  110. aiq/data_models/embedder.py +0 -27
  111. aiq/data_models/evaluate.py +0 -127
  112. aiq/data_models/evaluator.py +0 -26
  113. aiq/data_models/front_end.py +0 -26
  114. aiq/data_models/function.py +0 -30
  115. aiq/data_models/function_dependencies.py +0 -72
  116. aiq/data_models/interactive.py +0 -246
  117. aiq/data_models/intermediate_step.py +0 -302
  118. aiq/data_models/invocation_node.py +0 -38
  119. aiq/data_models/its_strategy.py +0 -30
  120. aiq/data_models/llm.py +0 -27
  121. aiq/data_models/logging.py +0 -26
  122. aiq/data_models/memory.py +0 -27
  123. aiq/data_models/object_store.py +0 -44
  124. aiq/data_models/profiler.py +0 -54
  125. aiq/data_models/registry_handler.py +0 -26
  126. aiq/data_models/retriever.py +0 -30
  127. aiq/data_models/retry_mixin.py +0 -35
  128. aiq/data_models/span.py +0 -187
  129. aiq/data_models/step_adaptor.py +0 -64
  130. aiq/data_models/streaming.py +0 -33
  131. aiq/data_models/swe_bench_model.py +0 -54
  132. aiq/data_models/telemetry_exporter.py +0 -26
  133. aiq/embedder/__init__.py +0 -0
  134. aiq/embedder/langchain_client.py +0 -41
  135. aiq/embedder/nim_embedder.py +0 -59
  136. aiq/embedder/openai_embedder.py +0 -43
  137. aiq/embedder/register.py +0 -24
  138. aiq/eval/__init__.py +0 -14
  139. aiq/eval/config.py +0 -60
  140. aiq/eval/dataset_handler/__init__.py +0 -0
  141. aiq/eval/dataset_handler/dataset_downloader.py +0 -106
  142. aiq/eval/dataset_handler/dataset_filter.py +0 -52
  143. aiq/eval/dataset_handler/dataset_handler.py +0 -254
  144. aiq/eval/evaluate.py +0 -506
  145. aiq/eval/evaluator/__init__.py +0 -14
  146. aiq/eval/evaluator/base_evaluator.py +0 -73
  147. aiq/eval/evaluator/evaluator_model.py +0 -45
  148. aiq/eval/intermediate_step_adapter.py +0 -99
  149. aiq/eval/rag_evaluator/__init__.py +0 -0
  150. aiq/eval/rag_evaluator/evaluate.py +0 -178
  151. aiq/eval/rag_evaluator/register.py +0 -143
  152. aiq/eval/register.py +0 -23
  153. aiq/eval/remote_workflow.py +0 -133
  154. aiq/eval/runners/__init__.py +0 -14
  155. aiq/eval/runners/config.py +0 -39
  156. aiq/eval/runners/multi_eval_runner.py +0 -54
  157. aiq/eval/runtime_event_subscriber.py +0 -52
  158. aiq/eval/swe_bench_evaluator/__init__.py +0 -0
  159. aiq/eval/swe_bench_evaluator/evaluate.py +0 -215
  160. aiq/eval/swe_bench_evaluator/register.py +0 -36
  161. aiq/eval/trajectory_evaluator/__init__.py +0 -0
  162. aiq/eval/trajectory_evaluator/evaluate.py +0 -75
  163. aiq/eval/trajectory_evaluator/register.py +0 -40
  164. aiq/eval/tunable_rag_evaluator/__init__.py +0 -0
  165. aiq/eval/tunable_rag_evaluator/evaluate.py +0 -245
  166. aiq/eval/tunable_rag_evaluator/register.py +0 -52
  167. aiq/eval/usage_stats.py +0 -41
  168. aiq/eval/utils/__init__.py +0 -0
  169. aiq/eval/utils/output_uploader.py +0 -140
  170. aiq/eval/utils/tqdm_position_registry.py +0 -40
  171. aiq/eval/utils/weave_eval.py +0 -184
  172. aiq/experimental/__init__.py +0 -0
  173. aiq/experimental/decorators/__init__.py +0 -0
  174. aiq/experimental/decorators/experimental_warning_decorator.py +0 -130
  175. aiq/experimental/inference_time_scaling/__init__.py +0 -0
  176. aiq/experimental/inference_time_scaling/editing/__init__.py +0 -0
  177. aiq/experimental/inference_time_scaling/editing/iterative_plan_refinement_editor.py +0 -147
  178. aiq/experimental/inference_time_scaling/editing/llm_as_a_judge_editor.py +0 -204
  179. aiq/experimental/inference_time_scaling/editing/motivation_aware_summarization.py +0 -107
  180. aiq/experimental/inference_time_scaling/functions/__init__.py +0 -0
  181. aiq/experimental/inference_time_scaling/functions/execute_score_select_function.py +0 -105
  182. aiq/experimental/inference_time_scaling/functions/its_tool_orchestration_function.py +0 -205
  183. aiq/experimental/inference_time_scaling/functions/its_tool_wrapper_function.py +0 -146
  184. aiq/experimental/inference_time_scaling/functions/plan_select_execute_function.py +0 -224
  185. aiq/experimental/inference_time_scaling/models/__init__.py +0 -0
  186. aiq/experimental/inference_time_scaling/models/editor_config.py +0 -132
  187. aiq/experimental/inference_time_scaling/models/its_item.py +0 -48
  188. aiq/experimental/inference_time_scaling/models/scoring_config.py +0 -112
  189. aiq/experimental/inference_time_scaling/models/search_config.py +0 -120
  190. aiq/experimental/inference_time_scaling/models/selection_config.py +0 -154
  191. aiq/experimental/inference_time_scaling/models/stage_enums.py +0 -43
  192. aiq/experimental/inference_time_scaling/models/strategy_base.py +0 -66
  193. aiq/experimental/inference_time_scaling/models/tool_use_config.py +0 -41
  194. aiq/experimental/inference_time_scaling/register.py +0 -36
  195. aiq/experimental/inference_time_scaling/scoring/__init__.py +0 -0
  196. aiq/experimental/inference_time_scaling/scoring/llm_based_agent_scorer.py +0 -168
  197. aiq/experimental/inference_time_scaling/scoring/llm_based_plan_scorer.py +0 -168
  198. aiq/experimental/inference_time_scaling/scoring/motivation_aware_scorer.py +0 -111
  199. aiq/experimental/inference_time_scaling/search/__init__.py +0 -0
  200. aiq/experimental/inference_time_scaling/search/multi_llm_planner.py +0 -128
  201. aiq/experimental/inference_time_scaling/search/multi_query_retrieval_search.py +0 -122
  202. aiq/experimental/inference_time_scaling/search/single_shot_multi_plan_planner.py +0 -128
  203. aiq/experimental/inference_time_scaling/selection/__init__.py +0 -0
  204. aiq/experimental/inference_time_scaling/selection/best_of_n_selector.py +0 -63
  205. aiq/experimental/inference_time_scaling/selection/llm_based_agent_output_selector.py +0 -131
  206. aiq/experimental/inference_time_scaling/selection/llm_based_output_merging_selector.py +0 -159
  207. aiq/experimental/inference_time_scaling/selection/llm_based_plan_selector.py +0 -128
  208. aiq/experimental/inference_time_scaling/selection/threshold_selector.py +0 -58
  209. aiq/front_ends/__init__.py +0 -14
  210. aiq/front_ends/console/__init__.py +0 -14
  211. aiq/front_ends/console/authentication_flow_handler.py +0 -233
  212. aiq/front_ends/console/console_front_end_config.py +0 -32
  213. aiq/front_ends/console/console_front_end_plugin.py +0 -96
  214. aiq/front_ends/console/register.py +0 -25
  215. aiq/front_ends/cron/__init__.py +0 -14
  216. aiq/front_ends/fastapi/__init__.py +0 -14
  217. aiq/front_ends/fastapi/auth_flow_handlers/__init__.py +0 -0
  218. aiq/front_ends/fastapi/auth_flow_handlers/http_flow_handler.py +0 -27
  219. aiq/front_ends/fastapi/auth_flow_handlers/websocket_flow_handler.py +0 -107
  220. aiq/front_ends/fastapi/fastapi_front_end_config.py +0 -234
  221. aiq/front_ends/fastapi/fastapi_front_end_controller.py +0 -68
  222. aiq/front_ends/fastapi/fastapi_front_end_plugin.py +0 -116
  223. aiq/front_ends/fastapi/fastapi_front_end_plugin_worker.py +0 -1092
  224. aiq/front_ends/fastapi/html_snippets/__init__.py +0 -14
  225. aiq/front_ends/fastapi/html_snippets/auth_code_grant_success.py +0 -35
  226. aiq/front_ends/fastapi/intermediate_steps_subscriber.py +0 -80
  227. aiq/front_ends/fastapi/job_store.py +0 -183
  228. aiq/front_ends/fastapi/main.py +0 -72
  229. aiq/front_ends/fastapi/message_handler.py +0 -298
  230. aiq/front_ends/fastapi/message_validator.py +0 -345
  231. aiq/front_ends/fastapi/register.py +0 -25
  232. aiq/front_ends/fastapi/response_helpers.py +0 -195
  233. aiq/front_ends/fastapi/step_adaptor.py +0 -321
  234. aiq/front_ends/mcp/__init__.py +0 -14
  235. aiq/front_ends/mcp/mcp_front_end_config.py +0 -32
  236. aiq/front_ends/mcp/mcp_front_end_plugin.py +0 -93
  237. aiq/front_ends/mcp/register.py +0 -27
  238. aiq/front_ends/mcp/tool_converter.py +0 -242
  239. aiq/front_ends/register.py +0 -22
  240. aiq/front_ends/simple_base/__init__.py +0 -14
  241. aiq/front_ends/simple_base/simple_front_end_plugin_base.py +0 -54
  242. aiq/llm/__init__.py +0 -0
  243. aiq/llm/aws_bedrock_llm.py +0 -57
  244. aiq/llm/nim_llm.py +0 -46
  245. aiq/llm/openai_llm.py +0 -46
  246. aiq/llm/register.py +0 -23
  247. aiq/llm/utils/__init__.py +0 -14
  248. aiq/llm/utils/env_config_value.py +0 -94
  249. aiq/llm/utils/error.py +0 -17
  250. aiq/memory/__init__.py +0 -20
  251. aiq/memory/interfaces.py +0 -183
  252. aiq/memory/models.py +0 -112
  253. aiq/meta/module_to_distro.json +0 -3
  254. aiq/meta/pypi.md +0 -58
  255. aiq/object_store/__init__.py +0 -20
  256. aiq/object_store/in_memory_object_store.py +0 -76
  257. aiq/object_store/interfaces.py +0 -84
  258. aiq/object_store/models.py +0 -36
  259. aiq/object_store/register.py +0 -20
  260. aiq/observability/__init__.py +0 -14
  261. aiq/observability/exporter/__init__.py +0 -14
  262. aiq/observability/exporter/base_exporter.py +0 -449
  263. aiq/observability/exporter/exporter.py +0 -78
  264. aiq/observability/exporter/file_exporter.py +0 -33
  265. aiq/observability/exporter/processing_exporter.py +0 -322
  266. aiq/observability/exporter/raw_exporter.py +0 -52
  267. aiq/observability/exporter/span_exporter.py +0 -265
  268. aiq/observability/exporter_manager.py +0 -335
  269. aiq/observability/mixin/__init__.py +0 -14
  270. aiq/observability/mixin/batch_config_mixin.py +0 -26
  271. aiq/observability/mixin/collector_config_mixin.py +0 -23
  272. aiq/observability/mixin/file_mixin.py +0 -288
  273. aiq/observability/mixin/file_mode.py +0 -23
  274. aiq/observability/mixin/resource_conflict_mixin.py +0 -134
  275. aiq/observability/mixin/serialize_mixin.py +0 -61
  276. aiq/observability/mixin/type_introspection_mixin.py +0 -183
  277. aiq/observability/processor/__init__.py +0 -14
  278. aiq/observability/processor/batching_processor.py +0 -309
  279. aiq/observability/processor/callback_processor.py +0 -42
  280. aiq/observability/processor/intermediate_step_serializer.py +0 -28
  281. aiq/observability/processor/processor.py +0 -71
  282. aiq/observability/register.py +0 -96
  283. aiq/observability/utils/__init__.py +0 -14
  284. aiq/observability/utils/dict_utils.py +0 -236
  285. aiq/observability/utils/time_utils.py +0 -31
  286. aiq/plugins/.namespace +0 -1
  287. aiq/profiler/__init__.py +0 -0
  288. aiq/profiler/calc/__init__.py +0 -14
  289. aiq/profiler/calc/calc_runner.py +0 -627
  290. aiq/profiler/calc/calculations.py +0 -288
  291. aiq/profiler/calc/data_models.py +0 -188
  292. aiq/profiler/calc/plot.py +0 -345
  293. aiq/profiler/callbacks/__init__.py +0 -0
  294. aiq/profiler/callbacks/agno_callback_handler.py +0 -295
  295. aiq/profiler/callbacks/base_callback_class.py +0 -20
  296. aiq/profiler/callbacks/langchain_callback_handler.py +0 -290
  297. aiq/profiler/callbacks/llama_index_callback_handler.py +0 -205
  298. aiq/profiler/callbacks/semantic_kernel_callback_handler.py +0 -238
  299. aiq/profiler/callbacks/token_usage_base_model.py +0 -27
  300. aiq/profiler/data_frame_row.py +0 -51
  301. aiq/profiler/data_models.py +0 -24
  302. aiq/profiler/decorators/__init__.py +0 -0
  303. aiq/profiler/decorators/framework_wrapper.py +0 -131
  304. aiq/profiler/decorators/function_tracking.py +0 -254
  305. aiq/profiler/forecasting/__init__.py +0 -0
  306. aiq/profiler/forecasting/config.py +0 -18
  307. aiq/profiler/forecasting/model_trainer.py +0 -75
  308. aiq/profiler/forecasting/models/__init__.py +0 -22
  309. aiq/profiler/forecasting/models/forecasting_base_model.py +0 -40
  310. aiq/profiler/forecasting/models/linear_model.py +0 -196
  311. aiq/profiler/forecasting/models/random_forest_regressor.py +0 -268
  312. aiq/profiler/inference_metrics_model.py +0 -28
  313. aiq/profiler/inference_optimization/__init__.py +0 -0
  314. aiq/profiler/inference_optimization/bottleneck_analysis/__init__.py +0 -0
  315. aiq/profiler/inference_optimization/bottleneck_analysis/nested_stack_analysis.py +0 -460
  316. aiq/profiler/inference_optimization/bottleneck_analysis/simple_stack_analysis.py +0 -258
  317. aiq/profiler/inference_optimization/data_models.py +0 -386
  318. aiq/profiler/inference_optimization/experimental/__init__.py +0 -0
  319. aiq/profiler/inference_optimization/experimental/concurrency_spike_analysis.py +0 -468
  320. aiq/profiler/inference_optimization/experimental/prefix_span_analysis.py +0 -405
  321. aiq/profiler/inference_optimization/llm_metrics.py +0 -212
  322. aiq/profiler/inference_optimization/prompt_caching.py +0 -163
  323. aiq/profiler/inference_optimization/token_uniqueness.py +0 -107
  324. aiq/profiler/inference_optimization/workflow_runtimes.py +0 -72
  325. aiq/profiler/intermediate_property_adapter.py +0 -102
  326. aiq/profiler/profile_runner.py +0 -473
  327. aiq/profiler/utils.py +0 -184
  328. aiq/registry_handlers/__init__.py +0 -0
  329. aiq/registry_handlers/local/__init__.py +0 -0
  330. aiq/registry_handlers/local/local_handler.py +0 -176
  331. aiq/registry_handlers/local/register_local.py +0 -37
  332. aiq/registry_handlers/metadata_factory.py +0 -60
  333. aiq/registry_handlers/package_utils.py +0 -567
  334. aiq/registry_handlers/pypi/__init__.py +0 -0
  335. aiq/registry_handlers/pypi/pypi_handler.py +0 -251
  336. aiq/registry_handlers/pypi/register_pypi.py +0 -40
  337. aiq/registry_handlers/register.py +0 -21
  338. aiq/registry_handlers/registry_handler_base.py +0 -157
  339. aiq/registry_handlers/rest/__init__.py +0 -0
  340. aiq/registry_handlers/rest/register_rest.py +0 -56
  341. aiq/registry_handlers/rest/rest_handler.py +0 -237
  342. aiq/registry_handlers/schemas/__init__.py +0 -0
  343. aiq/registry_handlers/schemas/headers.py +0 -42
  344. aiq/registry_handlers/schemas/package.py +0 -68
  345. aiq/registry_handlers/schemas/publish.py +0 -63
  346. aiq/registry_handlers/schemas/pull.py +0 -82
  347. aiq/registry_handlers/schemas/remove.py +0 -36
  348. aiq/registry_handlers/schemas/search.py +0 -91
  349. aiq/registry_handlers/schemas/status.py +0 -47
  350. aiq/retriever/__init__.py +0 -0
  351. aiq/retriever/interface.py +0 -37
  352. aiq/retriever/milvus/__init__.py +0 -14
  353. aiq/retriever/milvus/register.py +0 -81
  354. aiq/retriever/milvus/retriever.py +0 -228
  355. aiq/retriever/models.py +0 -74
  356. aiq/retriever/nemo_retriever/__init__.py +0 -14
  357. aiq/retriever/nemo_retriever/register.py +0 -60
  358. aiq/retriever/nemo_retriever/retriever.py +0 -190
  359. aiq/retriever/register.py +0 -22
  360. aiq/runtime/__init__.py +0 -14
  361. aiq/runtime/loader.py +0 -215
  362. aiq/runtime/runner.py +0 -190
  363. aiq/runtime/session.py +0 -158
  364. aiq/runtime/user_metadata.py +0 -130
  365. aiq/settings/__init__.py +0 -0
  366. aiq/settings/global_settings.py +0 -318
  367. aiq/test/.namespace +0 -1
  368. aiq/tool/__init__.py +0 -0
  369. aiq/tool/chat_completion.py +0 -74
  370. aiq/tool/code_execution/README.md +0 -151
  371. aiq/tool/code_execution/__init__.py +0 -0
  372. aiq/tool/code_execution/code_sandbox.py +0 -267
  373. aiq/tool/code_execution/local_sandbox/.gitignore +0 -1
  374. aiq/tool/code_execution/local_sandbox/Dockerfile.sandbox +0 -60
  375. aiq/tool/code_execution/local_sandbox/__init__.py +0 -13
  376. aiq/tool/code_execution/local_sandbox/local_sandbox_server.py +0 -198
  377. aiq/tool/code_execution/local_sandbox/sandbox.requirements.txt +0 -6
  378. aiq/tool/code_execution/local_sandbox/start_local_sandbox.sh +0 -50
  379. aiq/tool/code_execution/register.py +0 -74
  380. aiq/tool/code_execution/test_code_execution_sandbox.py +0 -414
  381. aiq/tool/code_execution/utils.py +0 -100
  382. aiq/tool/datetime_tools.py +0 -42
  383. aiq/tool/document_search.py +0 -141
  384. aiq/tool/github_tools/__init__.py +0 -0
  385. aiq/tool/github_tools/create_github_commit.py +0 -133
  386. aiq/tool/github_tools/create_github_issue.py +0 -87
  387. aiq/tool/github_tools/create_github_pr.py +0 -106
  388. aiq/tool/github_tools/get_github_file.py +0 -106
  389. aiq/tool/github_tools/get_github_issue.py +0 -166
  390. aiq/tool/github_tools/get_github_pr.py +0 -256
  391. aiq/tool/github_tools/update_github_issue.py +0 -100
  392. aiq/tool/mcp/__init__.py +0 -14
  393. aiq/tool/mcp/exceptions.py +0 -142
  394. aiq/tool/mcp/mcp_client.py +0 -255
  395. aiq/tool/mcp/mcp_tool.py +0 -96
  396. aiq/tool/memory_tools/__init__.py +0 -0
  397. aiq/tool/memory_tools/add_memory_tool.py +0 -79
  398. aiq/tool/memory_tools/delete_memory_tool.py +0 -67
  399. aiq/tool/memory_tools/get_memory_tool.py +0 -72
  400. aiq/tool/nvidia_rag.py +0 -95
  401. aiq/tool/register.py +0 -38
  402. aiq/tool/retriever.py +0 -89
  403. aiq/tool/server_tools.py +0 -66
  404. aiq/utils/__init__.py +0 -0
  405. aiq/utils/data_models/__init__.py +0 -0
  406. aiq/utils/data_models/schema_validator.py +0 -58
  407. aiq/utils/debugging_utils.py +0 -43
  408. aiq/utils/dump_distro_mapping.py +0 -32
  409. aiq/utils/exception_handlers/__init__.py +0 -0
  410. aiq/utils/exception_handlers/automatic_retries.py +0 -289
  411. aiq/utils/exception_handlers/mcp.py +0 -211
  412. aiq/utils/exception_handlers/schemas.py +0 -114
  413. aiq/utils/io/__init__.py +0 -0
  414. aiq/utils/io/model_processing.py +0 -28
  415. aiq/utils/io/yaml_tools.py +0 -119
  416. aiq/utils/log_utils.py +0 -37
  417. aiq/utils/metadata_utils.py +0 -74
  418. aiq/utils/optional_imports.py +0 -142
  419. aiq/utils/producer_consumer_queue.py +0 -178
  420. aiq/utils/reactive/__init__.py +0 -0
  421. aiq/utils/reactive/base/__init__.py +0 -0
  422. aiq/utils/reactive/base/observable_base.py +0 -65
  423. aiq/utils/reactive/base/observer_base.py +0 -55
  424. aiq/utils/reactive/base/subject_base.py +0 -79
  425. aiq/utils/reactive/observable.py +0 -59
  426. aiq/utils/reactive/observer.py +0 -76
  427. aiq/utils/reactive/subject.py +0 -131
  428. aiq/utils/reactive/subscription.py +0 -49
  429. aiq/utils/settings/__init__.py +0 -0
  430. aiq/utils/settings/global_settings.py +0 -197
  431. aiq/utils/string_utils.py +0 -38
  432. aiq/utils/type_converter.py +0 -290
  433. aiq/utils/type_utils.py +0 -484
  434. aiq/utils/url_utils.py +0 -27
  435. aiqtoolkit-1.2.0rc4.dist-info/METADATA +0 -363
  436. aiqtoolkit-1.2.0rc4.dist-info/RECORD +0 -438
  437. aiqtoolkit-1.2.0rc4.dist-info/entry_points.txt +0 -20
  438. aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE-3rd-party.txt +0 -3686
  439. aiqtoolkit-1.2.0rc4.dist-info/licenses/LICENSE.md +0 -201
  440. aiqtoolkit-1.2.0rc4.dist-info/top_level.txt +0 -1
  441. {aiqtoolkit-1.2.0rc4.dist-info → aiqtoolkit-1.2.0rc5.dist-info}/WHEEL +0 -0
@@ -1,108 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import asyncio
17
- import logging
18
- from contextlib import AsyncExitStack
19
- from pathlib import Path
20
-
21
- import click
22
-
23
- from aiq.data_models.registry_handler import RegistryHandlerBaseConfig
24
- from aiq.utils.data_models.schema_validator import validate_yaml
25
-
26
- logger = logging.getLogger(__name__)
27
-
28
-
29
async def remove_artifact(registry_handler_config: RegistryHandlerBaseConfig, packages: list[dict[str, str]]) -> None:
    """
    Remove packages through the registry handler built from ``registry_handler_config``.

    Args:
        registry_handler_config: Channel configuration. Its type is used to look up the matching registry
            handler in the global type registry, and it is passed to that handler's build function.
        packages: Package entries passed as the ``packages`` field of ``PackageNameVersionList``.

    If the package entries cannot be turned into a ``PackageNameVersionList``, the error is logged and the
    function returns without asking the handler to remove anything.
    """

    # Imported lazily, as in the rest of the CLI, so the registry is only loaded when the command runs.
    from aiq.cli.type_registry import GlobalTypeRegistry
    from aiq.registry_handlers.schemas.package import PackageNameVersionList

    registry = GlobalTypeRegistry.get()

    async with AsyncExitStack() as stack:

        registry_handler_info = registry.get_registry_handler(type(registry_handler_config))
        registry_handler = await stack.enter_async_context(registry_handler_info.build_fn(registry_handler_config))

        try:
            package_name_list = PackageNameVersionList(packages=packages)
        except Exception as e:
            logger.exception("Invalid package format: '%s'", e, exc_info=True)
            # Nothing valid to remove. Returning here prevents the call below from referencing an
            # unbound `package_name_list` and masking the real error with an UnboundLocalError.
            return

        await stack.enter_async_context(registry_handler.remove(packages=package_name_list))
47
-
48
-
49
@click.group(name=__name__,
             invoke_without_command=True,
             help=("Remove AIQ Toolkit artifact from a remote registry by name and version."))
@click.argument("packages", type=str)
@click.option(
    "--config_file",
    type=click.Path(exists=True, file_okay=True, dir_okay=False, path_type=Path),
    callback=validate_yaml,
    required=False,
    help=("A YAML file to override the channel settings."),
)
@click.option(
    "-c",
    "--channel",
    type=str,
    required=True,
    help=("The remote registry channel that will remove the AIQ Toolkit artifact."),
)
def remove(channel: str, config_file: str, packages: str) -> None:
    """
    Remove AIQ Toolkit artifacts from a remote registry.

    ``packages`` is a whitespace-separated string of ``name`` or ``name==version`` entries. Entries with
    more than one ``==`` are reported as invalid and skipped.
    """

    from aiq.settings.global_settings import GlobalSettings

    # Turn each whitespace-separated entry into a {"name": ..., "version": ...} mapping.
    packages_versions = []
    for spec in packages.split():
        parts = spec.split("==")

        if len(parts) > 2:
            logger.error(f"Invalid input: '{spec}'")
            continue

        entry = {"name": parts[0]}
        if len(parts) == 2:
            entry["version"] = parts[1]
        else:
            # A bare name is still accepted; only warn that no version was given.
            logger.warning(f"No package version provided for '{parts[0]}'.")
        packages_versions.append(entry)

    settings = GlobalSettings().get()
    if config_file is not None:
        settings = settings.override_settings(config_file)

    try:
        remove_channel_config = settings.channels.get(channel)
        if remove_channel_config is None:
            logger.error("Remove channel '%s' has not been configured.", channel)
            return
    except Exception as e:
        logger.exception("Error loading user settings: %s", e, exc_info=True)
        return

    asyncio.run(remove_artifact(registry_handler_config=remove_channel_config, packages=packages_versions))
@@ -1,155 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import asyncio
17
- import logging
18
- from contextlib import AsyncExitStack
19
- from pathlib import Path
20
-
21
- import click
22
-
23
- from aiq.data_models.component import AIQComponentEnum
24
- from aiq.data_models.registry_handler import RegistryHandlerBaseConfig
25
- from aiq.registry_handlers.schemas.search import SearchFields
26
- from aiq.registry_handlers.schemas.status import StatusEnum
27
- from aiq.utils.data_models.schema_validator import validate_yaml
28
-
29
- logger = logging.getLogger(__name__)
30
-
31
-
32
async def search_artifacts(  # pylint: disable=R0917
        registry_handler_config: RegistryHandlerBaseConfig,
        query: str,
        search_fields: list[SearchFields],
        visualize: bool,
        component_types: list[AIQComponentEnum],
        save_path: str | None = None,
        n_results: int = 10) -> None:
    """
    Run a search against the registry handler built from ``registry_handler_config``.

    Args:
        registry_handler_config: Channel configuration. Its type selects the registry handler from the
            global type registry.
        query: The query string placed in the ``SearchQuery``.
        search_fields: Fields passed to the ``SearchQuery`` as ``fields``.
        visualize: When true and the search succeeds, the handler's ``visualize_search_results`` is called.
        component_types: Component types to search; an empty collection means every ``AIQComponentEnum`` value.
        save_path: When not ``None`` and the search succeeds, results are saved there by the handler.
        n_results: Passed to the ``SearchQuery`` as ``top_k``.
    """

    from aiq.cli.type_registry import GlobalTypeRegistry
    from aiq.registry_handlers.schemas.search import SearchQuery

    type_registry = GlobalTypeRegistry.get()

    async with AsyncExitStack() as stack:

        handler_info = type_registry.get_registry_handler(type(registry_handler_config))
        registry_handler = await stack.enter_async_context(handler_info.build_fn(registry_handler_config))

        # No explicit selection means "search every component type".
        selected_types = component_types if len(component_types) > 0 else [t.value for t in AIQComponentEnum]

        search_query = SearchQuery(query=query,
                                   fields=search_fields,
                                   top_k=n_results,
                                   component_types=selected_types)

        search_response = await stack.enter_async_context(registry_handler.search(query=search_query))

        succeeded = search_response.status.status == StatusEnum.SUCCESS

        if succeeded and visualize:
            registry_handler.visualize_search_results(search_response=search_response)
        if succeeded and save_path is not None:
            registry_handler.save_search_results(search_response=search_response, save_path=save_path)
-
64
-
65
@click.group(name=__name__, invoke_without_command=True, help="Search for AIQ Toolkit artifacts from remote registry.")
@click.option(
    "--config_file",
    type=click.Path(exists=True, file_okay=True, dir_okay=False, path_type=Path),
    callback=validate_yaml,
    required=False,
    # The file is only used to override the global channel settings (see the function body).
    help=("A YAML file to override the channel settings."),
)
@click.option(
    "-c",
    "--channel",
    type=str,
    required=True,
    help=("The remote registry channel to search for AIQ Toolkit artifacts."),
)
@click.option(
    "-o",
    "--output_path",
    type=str,
    required=False,
    help=("Path to save search results."),
)
@click.option(
    "-f",
    "--fields",
    multiple=True,
    type=click.Choice([e.value for e in SearchFields], case_sensitive=False),
    required=False,
    help=("The fields to include in the search."),
)
@click.option(
    "-q",
    "--query",
    type=str,
    required=True,
    help=("The query string."),
)
@click.option(
    "-n",
    "--n_results",
    type=int,
    required=False,
    default=10,
    help=("Number of search results to return."),
)
@click.option(
    "-t",
    "--types",
    "component_types",
    multiple=True,
    type=click.Choice([e.value for e in AIQComponentEnum], case_sensitive=False),
    required=False,
    help=("The component types to include in search."),
)
def search(  # pylint: disable=R0917
        config_file: str,
        channel: str,
        fields: list[str],
        query: str,
        component_types: list[AIQComponentEnum],
        n_results: int,
        output_path: str) -> None:
    """
    Search for AIQ Toolkit artifacts with the specified configuration.

    Loads the global settings, optionally overridden by ``config_file``, and looks up ``channel`` in the
    configured channels. If the channel is missing or the lookup raises, the problem is logged and the
    command returns. Otherwise ``search_artifacts`` is run with visualization enabled, and results are
    also saved when ``output_path`` is given.
    """

    from aiq.settings.global_settings import GlobalSettings

    settings = GlobalSettings().get()

    if (config_file is not None):
        settings = settings.override_settings(config_file)

    try:
        search_channel_config = settings.channels.get(channel)

        if (search_channel_config is None):
            logger.error("Search channel '%s' has not been configured.", channel)
            return
    except Exception as e:
        logger.exception("Error loading user settings: %s", e, exc_info=True)
        return

    asyncio.run(
        search_artifacts(registry_handler_config=search_channel_config,
                         query=query,
                         component_types=component_types,
                         search_fields=fields,
                         visualize=True,
                         save_path=output_path,
                         n_results=n_results))
@@ -1,14 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
@@ -1,297 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import asyncio
17
- import logging
18
- from pathlib import Path
19
-
20
- import click
21
- from tabulate import tabulate
22
-
23
- from aiq.profiler.calc.calc_runner import CalcRunner
24
- from aiq.profiler.calc.data_models import CalcRunnerConfig
25
- from aiq.profiler.calc.data_models import CalcRunnerOutput
26
-
27
- logger = logging.getLogger(__name__)
28
-
29
-
30
def _parse_concurrencies(concurrencies: str) -> list[int]:
    """Convert the comma-separated ``--concurrencies`` value into a list of ints.

    Blank entries (for example the one produced by a trailing comma) are skipped.

    Args:
        concurrencies: Raw option value, e.g. ``"1,2,4,8"``.

    Returns:
        The parsed integers in the order they were given.

    Raises:
        click.BadParameter: If an entry cannot be parsed as an integer.
    """
    values = []
    for token in concurrencies.split(","):
        token = token.strip()
        if not token:
            continue
        try:
            values.append(int(token))
        except ValueError as err:
            # Report a CLI usage error instead of letting a raw traceback escape.
            raise click.BadParameter(f"'{token}' is not a valid integer.", param_hint="--concurrencies") from err
    return values


@click.command("calc", help="Estimate GPU count and plot metrics for a workflow")
@click.option(
    "--config_file",
    type=click.Path(exists=True, file_okay=True, dir_okay=False, path_type=Path),
    required=False,
    default=None,
    help="A YAML config file for the workflow and evaluation. This is not needed in offline mode.",
)
@click.option(
    "--offline_mode",
    is_flag=True,
    required=False,
    default=False,
    help="Run in offline mode. This is used to estimate the GPU count for a workflow without running the workflow. ")
@click.option(
    "--target_llm_latency",
    type=float,
    required=False,
    default=0,
    help="Target p95 LLM latency (seconds). Can be set to 0 to ignore.",
)
@click.option(
    "--target_workflow_runtime",
    type=float,
    required=False,
    default=0,
    help="Target p95 workflow runtime (seconds). Can be set to 0 to ignore.",
)
@click.option(
    "--target_users",
    type=int,
    required=False,
    default=0,
    help="Target number of users to support.",
)
@click.option(
    "--test_gpu_count",
    type=int,
    required=False,
    default=0,
    help="Number of GPUs used in the test.",
)
@click.option(
    "--calc_output_dir",
    type=click.Path(file_okay=False, dir_okay=True, path_type=Path),
    required=False,
    default=None,
    help="Directory to save plots and results (optional).",
)
@click.option(
    "--concurrencies",
    type=str,
    required=False,
    default="1,2,3,4,5,6,7,8,9,10",
    help="Comma-separated list of concurrency values to test (e.g., 1,2,4,8). Default: 1,2,3,4,5,6,7,8,9,10",
)
@click.option(
    "--num_passes",
    type=int,
    required=False,
    default=0,
    help="Number of passes at each concurrency for the evaluation."
    " If set to 0 the dataset is adjusted to a multiple of the concurrency. Default: 0",
)
@click.option(
    "--append_calc_outputs",
    is_flag=True,
    required=False,
    default=False,
    help="Append calc outputs to the output directory. "
    "By default append is set to False and the content of the online directory is overwritten.",
)
@click.option(
    "--endpoint",
    type=str,
    required=False,
    default=None,
    help="Endpoint to use for the workflow if it is remote(optional).",
)
@click.option(
    "--endpoint_timeout",
    type=int,
    required=False,
    default=300,
    help="Timeout for the remote workflow endpoint in seconds (default: 300).",
)
@click.pass_context
def calc_command(ctx,
                 config_file,
                 offline_mode,
                 target_llm_latency,
                 target_workflow_runtime,
                 target_users,
                 test_gpu_count,
                 calc_output_dir,
                 concurrencies,
                 num_passes,
                 append_calc_outputs,
                 endpoint,
                 endpoint_timeout):
    """Estimate GPU count and plot metrics for a workflow profile.

    Validates the option combination for the selected mode, builds a
    ``CalcRunnerConfig``, runs ``CalcRunner`` to completion and prints the
    per-concurrency table plus any overall GPU estimates.

    Validation failures are reported with ``click.echo`` and the command returns
    without running anything. In offline mode the target latency/runtime, test GPU
    count, target users and output directory are all mandatory and appending is
    rejected; in online mode only the config file is mandatory and the remaining
    checks just print a notice.

    Raises:
        click.BadParameter: If ``--concurrencies`` contains a non-integer entry.
    """
    # Only use CLI concurrencies, with default
    concurrencies_list = _parse_concurrencies(concurrencies)

    if not concurrencies_list:
        click.echo("At least one concurrency value is required.")
        return

    # Don't allow a concurrency of 0
    if 0 in concurrencies_list:
        click.echo("Concurrency of 0 is not allowed.")
        return

    # Negative concurrencies are just as meaningless as 0
    if any(value < 0 for value in concurrencies_list):
        click.echo("Negative concurrency values are not allowed.")
        return

    # Check if the parameters are valid in online and offline mode
    if offline_mode:
        # In offline mode target test parameters are needed to estimate the GPU count
        if target_llm_latency == 0 and target_workflow_runtime == 0:
            click.echo("Both --target_llm_latency and --target_workflow_runtime are 0. "
                       "Cannot estimate the GPU count.")
            return
        if test_gpu_count <= 0:
            click.echo("Test GPU count is 0. Cannot estimate the GPU count.")
            return
        if target_users <= 0:
            click.echo("Target users is 0. Cannot estimate the GPU count.")
            return
        if append_calc_outputs:
            click.echo("Appending calc outputs is not supported in offline mode.")
            return
        if not calc_output_dir:
            click.echo("Output directory is required in offline mode.")
            return
    else:
        if not config_file:
            click.echo("Config file is required in online mode.")
            return
        # The remaining online checks are informational only: the run still proceeds.
        if target_llm_latency == 0 and target_workflow_runtime == 0:
            click.echo("Both --target_llm_latency and --target_workflow_runtime are 0. "
                       "GPU count will not be estimated.")
        if test_gpu_count <= 0:
            click.echo("Test GPU count is 0. Tests will be run but the GPU count will not be estimated.")
        if target_users <= 0:
            click.echo("Target users is 0. Tests will be run but the GPU count will not be estimated.")

    # Build CalcRunnerConfig
    runner_config = CalcRunnerConfig(
        config_file=config_file,
        concurrencies=concurrencies_list,
        target_llm_latency_p95=target_llm_latency,
        target_workflow_runtime_p95=target_workflow_runtime,
        target_users=target_users,
        test_gpu_count=test_gpu_count,
        output_dir=calc_output_dir,
        num_passes=num_passes,
        offline_mode=offline_mode,
        append_job=append_calc_outputs,
        endpoint=endpoint,
        endpoint_timeout=endpoint_timeout,
    )

    async def run_calc() -> CalcRunnerOutput:
        """Create the runner for ``runner_config`` and await its result."""
        runner = CalcRunner(runner_config)
        result = await runner.run()
        return result

    def print_results(results: CalcRunnerOutput):
        """Echo the targets, the per-concurrency table and the overall GPU estimates."""

        # Print header with target numbers
        click.echo(f"Targets: LLM Latency ≤ {runner_config.target_llm_latency_p95}s, "
                   f"Workflow Runtime ≤ {runner_config.target_workflow_runtime_p95}s, "
                   f"Users = {runner_config.target_users}")
        click.echo(f"Test parameters: GPUs = {runner_config.test_gpu_count}")

        # Check if there are any GPU estimates to determine if we should show GPU estimate columns
        has_llm_latency_gpu_estimates = any(data.gpu_estimates.gpu_estimate_by_llm_latency is not None
                                            for data in results.calc_data.values())
        has_wf_runtime_gpu_estimates = any(data.gpu_estimates.gpu_estimate_by_wf_runtime is not None
                                           for data in results.calc_data.values())

        # Check if there are any interrupted workflows or outliers to determine if we should show the alerts column
        has_alerts = any(data.sizing_metrics.alerts.workflow_interrupted or data.alerts.outlier_llm_latency
                         or data.alerts.outlier_workflow_runtime for data in results.calc_data.values())

        # Print per concurrency results as a table
        click.echo("Per concurrency results:")

        # Show alerts legend if there are any alerts
        if has_alerts:
            click.echo("Alerts!: W = Workflow interrupted, L = LLM latency outlier, R = Workflow runtime outlier")

        table = []
        for concurrency, data in results.calc_data.items():
            metrics = data.sizing_metrics
            gpu_estimates_per_concurrency = data.gpu_estimates
            sizing_metrics_alerts = data.sizing_metrics.alerts
            calc_alerts = data.alerts

            row = []

            # Only include the alerts column (first column) if any row has an alert of any kind
            if has_alerts:
                alerts = []
                if sizing_metrics_alerts.workflow_interrupted:
                    alerts.append("W")
                if calc_alerts.outlier_llm_latency:
                    alerts.append("L")
                if calc_alerts.outlier_workflow_runtime:
                    alerts.append("R")

                # Show ! followed by all alert characters
                if alerts:
                    row.append(f"!{''.join(alerts)}")
                else:
                    row.append("")

            row.extend([
                concurrency,
                metrics.llm_latency_p95,
                metrics.workflow_runtime_p95,
                metrics.total_runtime,
            ])

            # Only include GPU estimate columns if there are actual estimates of that type
            if has_llm_latency_gpu_estimates:
                row.append(gpu_estimates_per_concurrency.gpu_estimate_by_llm_latency)
            if has_wf_runtime_gpu_estimates:
                row.append(gpu_estimates_per_concurrency.gpu_estimate_by_wf_runtime)

            table.append(row)

        # Headers must be assembled in the same order as the row cells above.
        headers = []

        # Only include alerts header if there are any alerts (first column)
        if has_alerts:
            headers.append("Alerts")

        headers.extend([
            "Concurrency",
            "p95 LLM Latency",
            "p95 WF Runtime",
            "Total Runtime",
        ])

        # Only include GPU estimate headers if there are actual estimates of that type
        if has_llm_latency_gpu_estimates:
            headers.append("GPUs (LLM Latency, Rough)")
        if has_wf_runtime_gpu_estimates:
            headers.append("GPUs (WF Runtime, Rough)")

        click.echo(tabulate(table, headers=headers, tablefmt="github"))

        # Display slope-based GPU estimates if they are available
        if results.gpu_estimates.gpu_estimate_by_llm_latency is not None or \
                results.gpu_estimates.gpu_estimate_by_wf_runtime is not None:
            click.echo("")
            click.echo(click.style("=== GPU ESTIMATES ===", fg="bright_blue", bold=True))

            if results.gpu_estimates.gpu_estimate_by_wf_runtime is not None:
                click.echo(
                    click.style(
                        f"Estimated GPU count (Workflow Runtime): {results.gpu_estimates.gpu_estimate_by_wf_runtime:.1f}",
                        fg="green",
                        bold=True))
            if results.gpu_estimates.gpu_estimate_by_llm_latency is not None:
                click.echo(
                    click.style(
                        f"Estimated GPU count (LLM Latency): {results.gpu_estimates.gpu_estimate_by_llm_latency:.1f}",
                        fg="green",
                        bold=True))

    results = asyncio.run(run_calc())
    print_results(results)
@@ -1,27 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
- # SPDX-License-Identifier: Apache-2.0
3
- #
4
- # Licensed under the Apache License, Version 2.0 (the "License");
5
- # you may not use this file except in compliance with the License.
6
- # You may obtain a copy of the License at
7
- #
8
- # http://www.apache.org/licenses/LICENSE-2.0
9
- #
10
- # Unless required by applicable law or agreed to in writing, software
11
- # distributed under the License is distributed on an "AS IS" BASIS,
12
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- # See the License for the specific language governing permissions and
14
- # limitations under the License.
15
-
16
- import click
17
-
18
- from .calc import calc_command
19
-
20
-
21
@click.group(help="Size GPU clusters for workflows with the specified options.")
def sizing():
    """Command group under which the sizing subcommands are registered."""


# Attach the imported calc command to the group defined above.
sizing.add_command(calc_command)