mlx-stack 0.3.4__tar.gz → 0.3.6__tar.gz

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
Files changed (244)
  1. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.github/workflows/ci.yml +3 -0
  2. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.github/workflows/integration-nightly.yml +3 -0
  3. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.github/workflows/integration-prerelease.yml +3 -0
  4. mlx_stack-0.3.6/.release-please-manifest.json +3 -0
  5. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/CHANGELOG.md +24 -0
  6. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/Makefile +3 -2
  7. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/PKG-INFO +44 -17
  8. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/README.md +43 -16
  9. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/pyproject.toml +34 -1
  10. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/_version.py +2 -2
  11. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/bench.py +7 -12
  12. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/config.py +1 -3
  13. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/init.py +3 -7
  14. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/install.py +1 -3
  15. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/logs.py +3 -5
  16. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/models.py +5 -3
  17. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/profile.py +2 -6
  18. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/pull.py +4 -11
  19. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/recommend.py +8 -21
  20. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/setup.py +29 -32
  21. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/up.py +4 -12
  22. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/watch.py +6 -14
  23. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/benchmark.py +14 -25
  24. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/catalog.py +14 -35
  25. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/config.py +10 -8
  26. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/deps.py +5 -16
  27. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/discovery.py +13 -11
  28. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/hardware.py +1 -1
  29. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/launchd.py +6 -19
  30. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/litellm_gen.py +1 -3
  31. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/log_rotation.py +4 -9
  32. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/log_viewer.py +6 -9
  33. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/models.py +36 -35
  34. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/onboarding.py +55 -48
  35. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/process.py +9 -20
  36. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/pull.py +11 -24
  37. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/scoring.py +29 -21
  38. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/stack_down.py +9 -9
  39. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/stack_init.py +17 -16
  40. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/stack_status.py +29 -24
  41. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/stack_up.py +100 -94
  42. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/watchdog.py +6 -11
  43. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/conftest.py +2 -2
  44. mlx_stack-0.3.6/tests/factories.py +298 -0
  45. mlx_stack-0.3.6/tests/fakes.py +190 -0
  46. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/integration/conftest.py +27 -24
  47. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/integration/report.py +3 -3
  48. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/integration/test_catalog_validation.py +8 -11
  49. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/integration/test_harness_compatibility.py +8 -12
  50. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/integration/test_inference_e2e.py +8 -15
  51. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/integration/test_launchd_e2e.py +12 -28
  52. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/integration/test_model_smoke.py +2 -5
  53. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/integration/test_stack_integration.py +7 -16
  54. mlx_stack-0.3.6/tests/unit/conftest.py +106 -0
  55. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_benchmark.py +48 -46
  56. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_catalog.py +27 -15
  57. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli.py +8 -4
  58. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_bench.py +58 -25
  59. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_down.py +195 -142
  60. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_init.py +333 -273
  61. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_install.py +14 -38
  62. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_logs.py +32 -47
  63. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_models.py +104 -146
  64. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_profile.py +28 -84
  65. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_pull.py +289 -112
  66. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_recommend.py +214 -186
  67. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_setup.py +51 -36
  68. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_status.py +176 -161
  69. mlx_stack-0.3.6/tests/unit/test_cli_up.py +1148 -0
  70. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_watch.py +14 -23
  71. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_config.py +4 -7
  72. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cross_area.py +86 -150
  73. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_deps.py +16 -35
  74. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_discovery.py +4 -2
  75. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_hardware.py +5 -8
  76. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_launchd.py +14 -30
  77. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_lifecycle_fixes.py +66 -168
  78. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_litellm_gen.py +3 -12
  79. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_log_rotation.py +27 -27
  80. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_log_viewer.py +51 -68
  81. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_models.py +17 -49
  82. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_onboarding.py +109 -37
  83. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_ops_cross_area.py +151 -99
  84. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_paths.py +1 -3
  85. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_process.py +23 -20
  86. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_robustness_fixes.py +56 -86
  87. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_scoring.py +139 -260
  88. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_watchdog.py +199 -98
  89. mlx_stack-0.3.4/.release-please-manifest.json +0 -3
  90. mlx_stack-0.3.4/tests/unit/test_cli_up.py +0 -1584
  91. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/init.sh +0 -0
  92. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/library/architecture.md +0 -0
  93. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/library/environment.md +0 -0
  94. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/library/user-testing.md +0 -0
  95. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/services.yaml +0 -0
  96. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/settings.json +0 -0
  97. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/skills/cli-feature/SKILL.md +0 -0
  98. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/reviews/configuration-management.json +0 -0
  99. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/reviews/dependency-management.json +0 -0
  100. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/reviews/fix-catalog-errors-and-families.json +0 -0
  101. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/reviews/fix-deps-binary-and-ansi.json +0 -0
  102. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/reviews/fix-scaffolding-data-home.json +0 -0
  103. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/reviews/hardware-detection.json +0 -0
  104. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/reviews/model-catalog.json +0 -0
  105. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/reviews/project-scaffolding.json +0 -0
  106. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/synthesis.json +0 -0
  107. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/scrutiny/synthesis.round1.json +0 -0
  108. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/user-testing/flows/foundation-config-basic.json +0 -0
  109. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/user-testing/flows/foundation-config-deps.json +0 -0
  110. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/user-testing/flows/foundation-profile-catalog.json +0 -0
  111. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/user-testing/flows/foundation-setup-profile-core.json +0 -0
  112. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/foundation/user-testing/synthesis.json +0 -0
  113. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/scrutiny/reviews/down-command.json +0 -0
  114. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/scrutiny/reviews/fix-lifecycle-preflight-and-readonly.json +0 -0
  115. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/scrutiny/reviews/fix-lifecycle-process-robustness.json +0 -0
  116. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/scrutiny/reviews/fix-lifecycle-typecheck.json +0 -0
  117. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/scrutiny/reviews/process-management.json +0 -0
  118. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/scrutiny/reviews/status-command.json +0 -0
  119. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/scrutiny/reviews/up-command.json +0 -0
  120. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/scrutiny/synthesis.json +0 -0
  121. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/scrutiny/synthesis.round1.json +0 -0
  122. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/flows/r1-g1-deps-up-basics.json +0 -0
  123. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/flows/r1-g2-up-startup.json +0 -0
  124. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/flows/r1-g3-up-resilience.json +0 -0
  125. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/flows/r1-g4-down.json +0 -0
  126. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/flows/r1-g5-status.json +0 -0
  127. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/flows/r1-g6-cross.json +0 -0
  128. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/flows/r2-g1-fixes.json +0 -0
  129. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/flows/r2-g2-cross-blockers.json +0 -0
  130. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/synthesis.json +0 -0
  131. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/lifecycle/user-testing/synthesis.round1.json +0 -0
  132. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/misc-cross-area/scrutiny/reviews/fix-cross-area-test-rigor.json +0 -0
  133. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/misc-cross-area/scrutiny/reviews/misc-cross-area-validation.json +0 -0
  134. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/misc-cross-area/scrutiny/synthesis.json +0 -0
  135. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/misc-cross-area/scrutiny/synthesis.round1.json +0 -0
  136. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/misc-cross-area/user-testing/flows/r1-g1-cross-flows.json +0 -0
  137. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/misc-cross-area/user-testing/flows/r2-g4-cross-port5050.json +0 -0
  138. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/misc-cross-area/user-testing/synthesis.json +0 -0
  139. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/misc-cross-area/user-testing/synthesis.round1.json +0 -0
  140. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/reviews/fix-ops-lint-errors.json +0 -0
  141. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/reviews/fix-ops-scrutiny-issues.json +0 -0
  142. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/reviews/fix-ops-typecheck-errors.json +0 -0
  143. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/reviews/launchd-integration.json +0 -0
  144. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/reviews/log-rotation.json +0 -0
  145. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/reviews/logs-command.json +0 -0
  146. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/reviews/ops-cross-area-validation.json +0 -0
  147. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/reviews/watchdog-command.json +0 -0
  148. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/synthesis.json +0 -0
  149. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/scrutiny/synthesis.round1.json +0 -0
  150. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/user-testing/flows/g1-log.json +0 -0
  151. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/user-testing/flows/g2-logs-command.json +0 -0
  152. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/user-testing/flows/g3-watch.json +0 -0
  153. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/user-testing/flows/g4-launchd.json +0 -0
  154. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/user-testing/flows/g5-cross-ops.json +0 -0
  155. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/ops/user-testing/synthesis.json +0 -0
  156. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/public-ready/scrutiny/reviews/community-docs.json +0 -0
  157. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/public-ready/scrutiny/reviews/developing-guide.json +0 -0
  158. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/public-ready/scrutiny/reviews/fix-public-ready-scrutiny.json +0 -0
  159. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/public-ready/scrutiny/reviews/github-actions-ci.json +0 -0
  160. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/public-ready/scrutiny/reviews/readme-rewrite.json +0 -0
  161. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/public-ready/scrutiny/synthesis.json +0 -0
  162. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/public-ready/scrutiny/synthesis.round1.json +0 -0
  163. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/scrutiny/reviews/fix-init-and-models-issues.json +0 -0
  164. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/scrutiny/reviews/fix-recommendation-scoring-issues.json +0 -0
  165. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/scrutiny/reviews/fix-scoring-lint.json +0 -0
  166. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/scrutiny/reviews/init-command.json +0 -0
  167. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/scrutiny/reviews/models-command.json +0 -0
  168. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/scrutiny/reviews/recommend-command.json +0 -0
  169. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/scrutiny/reviews/scoring-engine.json +0 -0
  170. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/scrutiny/synthesis.json +0 -0
  171. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/scrutiny/synthesis.round1.json +0 -0
  172. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/g1-recommend-budget-ranking.json +0 -0
  173. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/g2-recommend-output-integration.json +0 -0
  174. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/g3-init-core-routing.json +0 -0
  175. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/g4-init-cloud-overwrite.json +0 -0
  176. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/g5-init-hardware-summary.json +0 -0
  177. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/g6-models-local.json +0 -0
  178. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/g7-models-catalog.json +0 -0
  179. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/r2-g1-recommend.json +0 -0
  180. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/r2-g2-models-catalog-filters.json +0 -0
  181. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/flows/r2-g3-cross-012.json +0 -0
  182. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/synthesis.json +0 -0
  183. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/recommendation/user-testing/synthesis.round1.json +0 -0
  184. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/scrutiny/reviews/bench-command.json +0 -0
  185. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/scrutiny/reviews/fix-tooling-scrutiny-issues.json +0 -0
  186. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/scrutiny/reviews/pull-command.json +0 -0
  187. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/scrutiny/synthesis.json +0 -0
  188. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/scrutiny/synthesis.round1.json +0 -0
  189. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/flows/g1-pull-core.json +0 -0
  190. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/flows/g2-pull-errors.json +0 -0
  191. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/flows/g3-bench-core.json +0 -0
  192. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/flows/g4-bench-advanced.json +0 -0
  193. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/flows/r2-g1-pull.json +0 -0
  194. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/flows/r2-g2-bench.json +0 -0
  195. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/flows/r3-g1-pull.json +0 -0
  196. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/flows/r3-g2-bench.json +0 -0
  197. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/flows/r4-g1-bench.json +0 -0
  198. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/synthesis.json +0 -0
  199. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/synthesis.round1.json +0 -0
  200. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/synthesis.round2.json +0 -0
  201. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.factory/validation/tooling/user-testing/synthesis.round3.json +0 -0
  202. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.github/release.yml +0 -0
  203. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.github/workflows/publish.yml +0 -0
  204. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.github/workflows/release-please.yml +0 -0
  205. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/.gitignore +0 -0
  206. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/CODE_OF_CONDUCT.md +0 -0
  207. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/CONTRIBUTING.md +0 -0
  208. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/DEVELOPING.md +0 -0
  209. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/LICENSE +0 -0
  210. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/SECURITY.md +0 -0
  211. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/release-please-config.json +0 -0
  212. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/__init__.py +0 -0
  213. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/__init__.py +0 -0
  214. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/down.py +0 -0
  215. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/main.py +0 -0
  216. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/cli/status.py +0 -0
  217. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/__init__.py +0 -0
  218. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/core/paths.py +0 -0
  219. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/__init__.py +0 -0
  220. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/benchmark_data.json +0 -0
  221. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/__init__.py +0 -0
  222. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/deepseek-r1-32b.yaml +0 -0
  223. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/deepseek-r1-8b.yaml +0 -0
  224. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/gemma3-12b.yaml +0 -0
  225. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/gemma3-27b.yaml +0 -0
  226. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/gemma3-4b.yaml +0 -0
  227. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/llama3.3-8b.yaml +0 -0
  228. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/nemotron-49b.yaml +0 -0
  229. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/nemotron-8b.yaml +0 -0
  230. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/qwen3-8b.yaml +0 -0
  231. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/qwen3.5-0.8b.yaml +0 -0
  232. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/qwen3.5-14b.yaml +0 -0
  233. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/qwen3.5-32b.yaml +0 -0
  234. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/qwen3.5-3b.yaml +0 -0
  235. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/qwen3.5-72b.yaml +0 -0
  236. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/data/catalog/qwen3.5-8b.yaml +0 -0
  237. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/py.typed +0 -0
  238. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/src/mlx_stack/utils/__init__.py +0 -0
  239. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/__init__.py +0 -0
  240. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/integration/__init__.py +0 -0
  241. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/__init__.py +0 -0
  242. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_cli_config.py +0 -0
  243. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/tests/unit/test_data_dir.py +0 -0
  244. {mlx_stack-0.3.4 → mlx_stack-0.3.6}/uv.lock +0 -0
@@ -5,6 +5,9 @@ on:
5
5
  branches: [main]
6
6
  pull_request:
7
7
 
8
+ permissions:
9
+ contents: read
10
+
8
11
  concurrency:
9
12
  group: ${{ github.workflow }}-${{ github.head_ref || github.ref_name }}
10
13
  cancel-in-progress: true
@@ -9,6 +9,9 @@ on:
9
9
  description: "Specific model ID to test (blank = all non-gated models that fit in memory)"
10
10
  required: false
11
11
 
12
+ permissions:
13
+ contents: read
14
+
12
15
  concurrency:
13
16
  group: nightly-integration
14
17
  cancel-in-progress: true
@@ -5,6 +5,9 @@ on:
5
5
  types: [created]
6
6
  workflow_dispatch:
7
7
 
8
+ permissions:
9
+ contents: read
10
+
8
11
  concurrency:
9
12
  group: prerelease-integration
10
13
  cancel-in-progress: true
@@ -0,0 +1,3 @@
1
+ {
2
+ ".": "0.3.6"
3
+ }
@@ -4,6 +4,30 @@ All notable changes to this project will be documented in this file.
4
4
 
5
5
  The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/), and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
6
6
 
7
+ ## [0.3.6](https://github.com/weklund/mlx-stack/compare/v0.3.5...v0.3.6) (2026-04-04)
8
+
9
+
10
+ ### Bug Fixes
11
+
12
+ * add explicit permissions to CI and integration workflows ([#34](https://github.com/weklund/mlx-stack/issues/34)) ([0f8bfb0](https://github.com/weklund/mlx-stack/commit/0f8bfb0a17df82142261284f8d6405918ae6b759))
13
+
14
+ ## [0.3.5](https://github.com/weklund/mlx-stack/compare/v0.3.4...v0.3.5) (2026-04-04)
15
+
16
+
17
+ ### Features
18
+
19
+ * expand ruff lint rules with tier 1+2 quality rulesets ([#22](https://github.com/weklund/mlx-stack/issues/22)) ([75490f6](https://github.com/weklund/mlx-stack/commit/75490f6817a87a6b63818fa1f7c1660e59766ba3))
20
+
21
+
22
+ ### Refactors
23
+
24
+ * **tests:** replace brittle mock-heavy tests with behavioral tests and shared factories ([#32](https://github.com/weklund/mlx-stack/issues/32)) ([9af6078](https://github.com/weklund/mlx-stack/commit/9af60781e14c1466219ee2644928db9c9a39041e))
25
+ - `FakeServiceLayer` replaces 10-deep `@patch` stacks in `TestRunUp`
26
+ - Consolidate ~50 duplicate helpers into `tests/factories.py`
27
+ - AAA comments (`# Arrange`, `# Act`, `# Assert`) across 17 test files
28
+ - `make lint` now includes pyright for shift-left type checking
29
+ - Net: -577 lines, 1,481 tests pass, 73% reduction in `@patch` usage
30
+
7
31
  ## [0.3.4](https://github.com/weklund/mlx-stack/compare/v0.3.3...v0.3.4) (2026-04-03)
8
32
 
9
33
 
@@ -4,11 +4,12 @@
4
4
  install:
5
5
  uv sync --dev
6
6
 
7
- ## Lint source and tests
7
+ ## Lint source and tests (ruff + pyright)
8
8
  lint:
9
9
  uv run ruff check src/ tests/
10
+ uv run python -m pyright
10
11
 
11
- ## Run type checker across the full project
12
+ ## Run type checker only (alias kept for CI compatibility)
12
13
  typecheck:
13
14
  uv run python -m pyright
14
15
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: mlx-stack
3
- Version: 0.3.4
3
+ Version: 0.3.6
4
4
  Summary: CLI control plane for local LLM infrastructure on Apple Silicon
5
5
  Project-URL: Homepage, https://github.com/weklund/mlx-stack
6
6
  Project-URL: Repository, https://github.com/weklund/mlx-stack
@@ -43,8 +43,7 @@ Most local LLM tools serve **one model at a time** and leave you to figure out w
43
43
 
44
44
  ```bash
45
45
  uv tool install mlx-stack
46
- mlx-stack init --accept-defaults # detects hardware, picks models, generates configs
47
- mlx-stack up # 3 model servers + API gateway, one command
46
+ mlx-stack setup # detects hardware, picks models, pulls, starts — one command
48
47
  # → OpenAI-compatible API at http://localhost:4000/v1
49
48
  ```
50
49
 
@@ -170,6 +169,33 @@ uvx mlx-stack profile
170
169
 
171
170
  ## Quick Start
172
171
 
172
+ The fastest way to get running is the interactive setup command:
173
+
174
+ ```bash
175
+ mlx-stack setup
176
+ ```
177
+
178
+ This walks you through hardware detection, model selection, downloading, and starting all services in one guided flow. For CI or scripting, pass `--accept-defaults` to skip all prompts:
179
+
180
+ ```bash
181
+ mlx-stack setup --accept-defaults
182
+ ```
183
+
184
+ The OpenAI-compatible API is now available at `http://localhost:4000/v1`.
185
+
186
+ ```bash
187
+ # Check service health
188
+ mlx-stack status
189
+
190
+ # Stop everything when done
191
+ mlx-stack down
192
+ ```
193
+
194
+ <details>
195
+ <summary>Manual step-by-step setup</summary>
196
+
197
+ If you prefer full control over each step:
198
+
173
199
  ```bash
174
200
  # 1. Detect your hardware
175
201
  mlx-stack profile
@@ -187,17 +213,20 @@ mlx-stack up
187
213
  mlx-stack status
188
214
  ```
189
215
 
190
- The OpenAI-compatible API is now available at `http://localhost:4000/v1`.
191
-
192
- ```bash
193
- # Stop everything when done
194
- mlx-stack down
195
- ```
216
+ </details>
196
217
 
197
218
  ## CLI Reference
198
219
 
199
220
  ### Setup & Configuration
200
221
 
222
+ **`mlx-stack setup`** — Interactive guided setup: detects hardware, selects models, pulls weights, and starts the stack in one command.
223
+
224
+ | Option | Description |
225
+ |--------|-------------|
226
+ | `--accept-defaults` | Skip all prompts and use recommended defaults |
227
+ | `--intent <balanced\|agent-fleet>` | Use case intent (prompted if not provided) |
228
+ | `--budget-pct <10-90>` | Memory budget as percentage of unified memory (default: 40) |
229
+
201
230
  | Command | Description |
202
231
  |---------|-------------|
203
232
  | `mlx-stack profile` | Detect Apple Silicon hardware and save profile to `~/.mlx-stack/profile.json` |
@@ -323,7 +352,7 @@ mlx-stack is designed to run unattended on always-on hardware like a Mac Mini.
323
352
  ### Quick setup
324
353
 
325
354
  ```bash
326
- mlx-stack init --accept-defaults
355
+ mlx-stack setup --accept-defaults
327
356
  mlx-stack install
328
357
  ```
329
358
 
@@ -436,14 +465,12 @@ See [DEVELOPING.md](DEVELOPING.md) for the full developer guide, including proje
436
465
  # Install dev dependencies
437
466
  uv sync
438
467
 
439
- # Run tests
440
- uv run pytest
441
-
442
- # Type checking
443
- uv run python -m pyright
468
+ # Run all checks (lint + typecheck + tests) — same as CI
469
+ make check
444
470
 
445
- # Linting
446
- uv run ruff check src/ tests/
471
+ # Or individually
472
+ make lint # ruff + pyright
473
+ make test # pytest with coverage
447
474
  ```
448
475
 
449
476
  ## Contributing
@@ -14,8 +14,7 @@ Most local LLM tools serve **one model at a time** and leave you to figure out w
14
14
 
15
15
  ```bash
16
16
  uv tool install mlx-stack
17
- mlx-stack init --accept-defaults # detects hardware, picks models, generates configs
18
- mlx-stack up # 3 model servers + API gateway, one command
17
+ mlx-stack setup # detects hardware, picks models, pulls, starts — one command
19
18
  # → OpenAI-compatible API at http://localhost:4000/v1
20
19
  ```
21
20
 
@@ -141,6 +140,33 @@ uvx mlx-stack profile
141
140
 
142
141
  ## Quick Start
143
142
 
143
+ The fastest way to get running is the interactive setup command:
144
+
145
+ ```bash
146
+ mlx-stack setup
147
+ ```
148
+
149
+ This walks you through hardware detection, model selection, downloading, and starting all services in one guided flow. For CI or scripting, pass `--accept-defaults` to skip all prompts:
150
+
151
+ ```bash
152
+ mlx-stack setup --accept-defaults
153
+ ```
154
+
155
+ The OpenAI-compatible API is now available at `http://localhost:4000/v1`.
156
+
157
+ ```bash
158
+ # Check service health
159
+ mlx-stack status
160
+
161
+ # Stop everything when done
162
+ mlx-stack down
163
+ ```
164
+
165
+ <details>
166
+ <summary>Manual step-by-step setup</summary>
167
+
168
+ If you prefer full control over each step:
169
+
144
170
  ```bash
145
171
  # 1. Detect your hardware
146
172
  mlx-stack profile
@@ -158,17 +184,20 @@ mlx-stack up
158
184
  mlx-stack status
159
185
  ```
160
186
 
161
- The OpenAI-compatible API is now available at `http://localhost:4000/v1`.
162
-
163
- ```bash
164
- # Stop everything when done
165
- mlx-stack down
166
- ```
187
+ </details>
167
188
 
168
189
  ## CLI Reference
169
190
 
170
191
  ### Setup & Configuration
171
192
 
193
+ **`mlx-stack setup`** — Interactive guided setup: detects hardware, selects models, pulls weights, and starts the stack in one command.
194
+
195
+ | Option | Description |
196
+ |--------|-------------|
197
+ | `--accept-defaults` | Skip all prompts and use recommended defaults |
198
+ | `--intent <balanced\|agent-fleet>` | Use case intent (prompted if not provided) |
199
+ | `--budget-pct <10-90>` | Memory budget as percentage of unified memory (default: 40) |
200
+
172
201
  | Command | Description |
173
202
  |---------|-------------|
174
203
  | `mlx-stack profile` | Detect Apple Silicon hardware and save profile to `~/.mlx-stack/profile.json` |
@@ -294,7 +323,7 @@ mlx-stack is designed to run unattended on always-on hardware like a Mac Mini.
294
323
  ### Quick setup
295
324
 
296
325
  ```bash
297
- mlx-stack init --accept-defaults
326
+ mlx-stack setup --accept-defaults
298
327
  mlx-stack install
299
328
  ```
300
329
 
@@ -407,14 +436,12 @@ See [DEVELOPING.md](DEVELOPING.md) for the full developer guide, including proje
407
436
  # Install dev dependencies
408
437
  uv sync
409
438
 
410
- # Run tests
411
- uv run pytest
412
-
413
- # Type checking
414
- uv run python -m pyright
439
+ # Run all checks (lint + typecheck + tests) — same as CI
440
+ make check
415
441
 
416
- # Linting
417
- uv run ruff check src/ tests/
442
+ # Or individually
443
+ make lint # ruff + pyright
444
+ make test # pytest with coverage
418
445
  ```
419
446
 
420
447
  ## Contributing
@@ -67,7 +67,40 @@ line-length = 100
67
67
  src = ["src", "tests"]
68
68
 
69
69
  [tool.ruff.lint]
70
- select = ["E", "F", "I", "W"]
70
+ select = [
71
+ # Tier 1 — high value, very safe
72
+ "E", # pycodestyle errors
73
+ "F", # pyflakes
74
+ "I", # isort
75
+ "W", # pycodestyle warnings
76
+ "UP", # pyupgrade — modern Python syntax
77
+ "B", # bugbear — common bug patterns
78
+ "SIM", # simplify — reduce complexity
79
+ "C4", # flake8-comprehensions
80
+ "RUF", # Ruff-specific rules
81
+ # Tier 2 — strong value, minor tuning
82
+ "PIE", # misc cleanup
83
+ "RET", # return simplification
84
+ "PERF", # performance anti-patterns
85
+ "PT", # pytest style
86
+ # "C90", # mccabe complexity — enable after refactoring complex functions
87
+ "FURB", # modernization
88
+ "FLY", # f-string conversion
89
+ ]
90
+ ignore = [
91
+ "E501", # line length (formatter handles this)
92
+ "SIM108", # ternary operator (opinionated)
93
+ "SIM117", # nested with statements (clearer in test mocking patterns)
94
+ "PT018", # composite assertions (splitting weakens error messages)
95
+ "PT019", # fixture without value (usefixtures less readable)
96
+ "PT017", # assert in except (valid test pattern)
97
+ ]
98
+
99
+ [tool.ruff.lint.mccabe]
100
+ max-complexity = 10
101
+
102
+ [tool.ruff.lint.per-file-ignores]
103
+ "src/mlx_stack/_version.py" = ["RUF022"] # auto-generated by hatch-vcs
71
104
 
72
105
  [tool.pyright]
73
106
  pythonVersion = "3.13"
@@ -18,7 +18,7 @@ version_tuple: tuple[int | str, ...]
18
18
  commit_id: str | None
19
19
  __commit_id__: str | None
20
20
 
21
- __version__ = version = '0.3.4'
22
- __version_tuple__ = version_tuple = (0, 3, 4)
21
+ __version__ = version = '0.3.6'
22
+ __version_tuple__ = version_tuple = (0, 3, 6)
23
23
 
24
24
  __commit_id__ = commit_id = None
@@ -168,23 +168,16 @@ def _display_results(result: BenchmarkResult_, out: Console, save: bool = False)
168
168
  out.print(Text("Tool Calling", style="bold cyan"))
169
169
  tc = result.tool_call_result
170
170
  if tc.success:
171
- out.print(
172
- f" [green]✓ Valid tool call[/green] — "
173
- f"round-trip: {tc.round_trip_time:.2f}s"
174
- )
171
+ out.print(f" [green]✓ Valid tool call[/green] — round-trip: {tc.round_trip_time:.2f}s")
175
172
  else:
176
- out.print(
177
- f" [red]✗ Tool call failed[/red] — {tc.error}"
178
- )
173
+ out.print(f" [red]✗ Tool call failed[/red] — {tc.error}")
179
174
  out.print()
180
175
  elif not result.tool_call_result:
181
176
  # Check if model supports tool calling from entry
182
177
  if not result.catalog_data_available:
183
178
  pass # Skip silently if no catalog data
184
179
  else:
185
- out.print(
186
- "[dim]Tool calling: skipped (model does not support tool calling)[/dim]"
187
- )
180
+ out.print("[dim]Tool calling: skipped (model does not support tool calling)[/dim]")
188
181
  out.print()
189
182
 
190
183
  # Iteration details
@@ -212,6 +205,8 @@ def _display_results(result: BenchmarkResult_, out: Console, save: bool = False)
212
205
 
213
206
  # Save confirmation
214
207
  if save:
215
- out.print("[green]✓ Results saved.[/green] "
216
- "These will be used by 'recommend' and 'init' for scoring.")
208
+ out.print(
209
+ "[green]✓ Results saved.[/green] "
210
+ "These will be used by 'recommend' and 'init' for scoring."
211
+ )
217
212
  out.print()
@@ -138,9 +138,7 @@ def config_reset(yes: bool, force: bool) -> None:
138
138
  # Check if stdin is a TTY for interactive confirmation
139
139
  try:
140
140
  if click.get_text_stream("stdin").isatty():
141
- confirmed = click.confirm(
142
- "Reset all configuration to defaults?", default=False
143
- )
141
+ confirmed = click.confirm("Reset all configuration to defaults?", default=False)
144
142
  else:
145
143
  console.print(
146
144
  "[bold red]Error:[/bold red] Reset requires --yes or --force flag "
@@ -64,13 +64,10 @@ def _display_summary(result: dict) -> None:
64
64
  budget_gb = result["memory_budget_gb"]
65
65
  total_memory_gb = result.get("total_memory_gb", 0.0)
66
66
  out.print(
67
- f"[dim]Hardware: {profile.chip} ({profile.memory_gb} GB) · "
68
- f"Budget: {budget_gb:.1f} GB[/dim]"
67
+ f"[dim]Hardware: {profile.chip} ({profile.memory_gb} GB) · Budget: {budget_gb:.1f} GB[/dim]"
69
68
  )
70
69
  if total_memory_gb > 0:
71
- out.print(
72
- f"[dim]Total estimated memory: {total_memory_gb:.1f} GB[/dim]"
73
- )
70
+ out.print(f"[dim]Total estimated memory: {total_memory_gb:.1f} GB[/dim]")
74
71
 
75
72
  # Warnings (e.g., memory budget exceeded with --add)
76
73
  init_warnings = result.get("warnings", [])
@@ -83,8 +80,7 @@ def _display_summary(result: dict) -> None:
83
80
  if stack.get("cloud_fallback"):
84
81
  out.print()
85
82
  out.print(
86
- "[bold green]☁ Cloud Fallback[/bold green] "
87
- "Premium tier via OpenRouter configured"
83
+ "[bold green]☁ Cloud Fallback[/bold green] Premium tier via OpenRouter configured"
88
84
  )
89
85
 
90
86
  # Missing models warning
@@ -42,9 +42,7 @@ def _display_status(status: AgentStatus) -> None:
42
42
  if not status.installed:
43
43
  out.print(Text("Status: not installed", style="dim"))
44
44
  elif status.running and status.pid is not None:
45
- out.print(
46
- Text(f"Status: installed and running (PID {status.pid})", style="green")
47
- )
45
+ out.print(Text(f"Status: installed and running (PID {status.pid})", style="green"))
48
46
  else:
49
47
  out.print(Text("Status: installed but not running", style="yellow"))
50
48
 
@@ -6,6 +6,7 @@ trigger on-demand rotation, and view archived logs.
6
6
 
7
7
  from __future__ import annotations
8
8
 
9
+ import contextlib
9
10
  import sys
10
11
 
11
12
  import click
@@ -78,7 +79,7 @@ def _display_rotation_results(results: list) -> None:
78
79
  out.print(f"[green]✓[/green] {result.service}: rotated")
79
80
  any_rotated = True
80
81
  else:
81
- out.print(f"[dim][/dim] {result.service}: no rotation needed")
82
+ out.print(f"[dim]-[/dim] {result.service}: no rotation needed")
82
83
 
83
84
  if not results:
84
85
  out.print(Text("No log files found to rotate.", style="yellow"))
@@ -213,11 +214,8 @@ def logs(
213
214
  # Handle --follow mode
214
215
  if follow:
215
216
  num = tail_lines if tail_lines is not None else DEFAULT_TAIL_LINES
216
- try:
217
+ with contextlib.suppress(KeyboardInterrupt):
217
218
  follow_log(log_path, num_lines=num, output_callback=click.echo)
218
- except KeyboardInterrupt:
219
- # Belt-and-suspenders: ensure clean exit
220
- pass
221
219
  return
222
220
 
223
221
  # Default: show tail of log
@@ -80,7 +80,7 @@ def _display_local_models() -> None:
80
80
  indicator_style = "bold green" if model.is_active else ""
81
81
 
82
82
  # Display name: prefer catalog name, fall back to directory name
83
- display_name = model.catalog_name if model.catalog_name else model.name
83
+ display_name = model.catalog_name or model.name
84
84
 
85
85
  # Size
86
86
  size_str = format_size(model.disk_size_bytes)
@@ -217,7 +217,7 @@ def _display_catalog(
217
217
  local_style = "bold green" if cm.is_local else ""
218
218
 
219
219
  # Parameters
220
- params_str = f"{cm.params_b:.1f}B" if cm.params_b >= 1.0 else f"{cm.params_b:.1f}B"
220
+ params_str = f"{cm.params_b:.1f}B"
221
221
 
222
222
  # Quantizations
223
223
  quants_str = ", ".join(cm.quants)
@@ -270,7 +270,9 @@ def _display_catalog(
270
270
  @click.option("--family", default=None, help="Filter catalog by model family (e.g., 'qwen3.5').")
271
271
  @click.option("--tag", default=None, help="Filter catalog by tag (e.g., 'agent-ready').")
272
272
  @click.option(
273
- "--tool-calling", "tool_calling", is_flag=True,
273
+ "--tool-calling",
274
+ "tool_calling",
275
+ is_flag=True,
274
276
  help="Filter catalog to tool-calling-capable models only.",
275
277
  )
276
278
  def models(
@@ -52,12 +52,8 @@ def profile() -> None:
52
52
 
53
53
  if hw.is_estimate:
54
54
  out.print()
55
- out.print(
56
- "[yellow] Bandwidth is estimated for unknown chip.[/yellow]"
57
- )
58
- out.print(
59
- " Run [bold]mlx-stack bench --save[/bold] to calibrate with real measurements."
60
- )
55
+ out.print("[yellow]⚠ Bandwidth is estimated for unknown chip.[/yellow]")
56
+ out.print(" Run [bold]mlx-stack bench --save[/bold] to calibrate with real measurements.")
61
57
 
62
58
  out.print()
63
59
  from mlx_stack.core.paths import get_profile_path
@@ -115,20 +115,13 @@ def _run_post_download_bench(model_id: str, quant: str, out: Console) -> None:
115
115
  from mlx_stack.core.benchmark import BenchmarkError, run_benchmark
116
116
 
117
117
  result = run_benchmark(target=model_id, save=True)
118
- out.print(
119
- f" Prompt TPS: {result.prompt_tps_mean:.1f} ± {result.prompt_tps_std:.1f} tok/s"
120
- )
121
- out.print(
122
- f" Gen TPS: {result.gen_tps_mean:.1f} ± {result.gen_tps_std:.1f} tok/s"
123
- )
118
+ out.print(f" Prompt TPS: {result.prompt_tps_mean:.1f} ± {result.prompt_tps_std:.1f} tok/s")
119
+ out.print(f" Gen TPS: {result.gen_tps_mean:.1f} ± {result.gen_tps_std:.1f} tok/s")
124
120
  out.print()
125
- out.print(
126
- "[dim]Results saved for use by 'recommend' and 'init' scoring.[/dim]"
127
- )
121
+ out.print("[dim]Results saved for use by 'recommend' and 'init' scoring.[/dim]")
128
122
  except BenchmarkError as exc:
129
123
  out.print(
130
- f"[yellow]Benchmark failed: {exc}[/yellow]\n"
131
- f"Run 'mlx-stack bench {model_id}' to retry."
124
+ f"[yellow]Benchmark failed: {exc}[/yellow]\nRun 'mlx-stack bench {model_id}' to retry."
132
125
  )
133
126
  except Exception as exc:
134
127
  out.print(
@@ -67,9 +67,7 @@ def parse_budget(raw: str) -> float:
67
67
 
68
68
  value = float(match.group(1))
69
69
  if value <= 0:
70
- msg = (
71
- f"Invalid budget '{raw}'. Budget must be a positive value."
72
- )
70
+ msg = f"Invalid budget '{raw}'. Budget must be a positive value."
73
71
  raise click.BadParameter(msg, param_hint="'--budget'")
74
72
 
75
73
  return value
@@ -96,8 +94,7 @@ def _resolve_profile() -> HardwareProfile:
96
94
  # Auto-detect (in-memory only — recommend is display-only, no file writes)
97
95
  console.print("[dim]No saved profile found — detecting hardware...[/dim]")
98
96
  try:
99
- profile = detect_hardware()
100
- return profile
97
+ return detect_hardware()
101
98
  except HardwareError as exc:
102
99
  console.print(f"[bold red]Error:[/bold red] {exc}")
103
100
  raise SystemExit(1) from None
@@ -206,12 +203,8 @@ def _display_tier_table(result: RecommendationResult) -> None:
206
203
  has_estimates = any(t.model.is_estimated for t in result.tiers)
207
204
  if has_estimates:
208
205
  out.print()
209
- out.print(
210
- "[yellow] Some performance values are estimated from bandwidth ratio.[/yellow]"
211
- )
212
- out.print(
213
- " Run [bold]mlx-stack bench --save[/bold] to calibrate with real measurements."
214
- )
206
+ out.print("[yellow]⚠ Some performance values are estimated from bandwidth ratio.[/yellow]")
207
+ out.print(" Run [bold]mlx-stack bench --save[/bold] to calibrate with real measurements.")
215
208
 
216
209
  out.print()
217
210
  out.print("[dim]This is a recommendation only — no files were written.[/dim]")
@@ -268,20 +261,15 @@ def _display_all_models(result: RecommendationResult) -> None:
268
261
  if openrouter_key:
269
262
  out.print()
270
263
  out.print(
271
- "[bold green]☁ Cloud Fallback[/bold green] "
272
- "Premium tier via OpenRouter also available."
264
+ "[bold green]☁ Cloud Fallback[/bold green] Premium tier via OpenRouter also available."
273
265
  )
274
266
 
275
267
  # Estimated warning
276
268
  has_estimates = any(m.is_estimated for m in result.all_scored)
277
269
  if has_estimates:
278
270
  out.print()
279
- out.print(
280
- "[yellow] Some performance values are estimated from bandwidth ratio.[/yellow]"
281
- )
282
- out.print(
283
- " Run [bold]mlx-stack bench --save[/bold] to calibrate with real measurements."
284
- )
271
+ out.print("[yellow]⚠ Some performance values are estimated from bandwidth ratio.[/yellow]")
272
+ out.print(" Run [bold]mlx-stack bench --save[/bold] to calibrate with real measurements.")
285
273
 
286
274
  out.print()
287
275
  out.print("[dim]This is a recommendation only — no files were written.[/dim]")
@@ -329,8 +317,7 @@ def recommend(budget: str | None, intent: str | None, show_all: bool) -> None:
329
317
  elif intent not in VALID_INTENTS:
330
318
  valid = ", ".join(sorted(VALID_INTENTS))
331
319
  console.print(
332
- f"[bold red]Error:[/bold red] Invalid intent '{intent}'. "
333
- f"Valid intents: {valid}"
320
+ f"[bold red]Error:[/bold red] Invalid intent '{intent}'. Valid intents: {valid}"
334
321
  )
335
322
  raise SystemExit(1)
336
323