localcode 0.2.15__tar.gz → 0.2.16__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (943)
  1. {localcode-0.2.15/src/localcode.egg-info → localcode-0.2.16}/PKG-INFO +22 -5
  2. {localcode-0.2.15 → localcode-0.2.16}/README.md +21 -4
  3. {localcode-0.2.15 → localcode-0.2.16}/pyproject.toml +1 -1
  4. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/__init__.py +1 -1
  5. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/__init__.py +2 -3
  6. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/helpers.py +0 -10
  7. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/sections.py +2 -11
  8. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/app.py +1 -63
  9. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/autonomy.py +0 -15
  10. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/bootstrap.py +6 -15
  11. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/formatting.py +0 -9
  12. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/model_families.py +1 -1
  13. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/models_catalog.py +45 -46
  14. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/patching.py +0 -25
  15. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/plans.py +0 -8
  16. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/process_registry.py +0 -20
  17. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/recommendations.py +1 -1
  18. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/runtime.py +1 -1
  19. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/snapshots.py +0 -18
  20. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/telemetry.py +0 -18
  21. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/theme.py +1 -20
  22. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tool_parsing.py +0 -11
  23. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tool_router.py +0 -60
  24. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/chat.py +22 -10
  25. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/setup.py +7 -7
  26. localcode-0.2.16/src/localcode/verification.py +87 -0
  27. {localcode-0.2.15 → localcode-0.2.16/src/localcode.egg-info}/PKG-INFO +22 -5
  28. {localcode-0.2.15 → localcode-0.2.16}/tests/test_agent_event_regressions.py +0 -24
  29. localcode-0.2.15/src/localcode/verification.py +0 -197
  30. {localcode-0.2.15 → localcode-0.2.16}/LICENSE +0 -0
  31. {localcode-0.2.15 → localcode-0.2.16}/MANIFEST.in +0 -0
  32. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/CMakeLists.txt +0 -0
  33. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/CMakePresets.json +0 -0
  34. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/LICENSE +0 -0
  35. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/arm64-apple-clang.cmake +0 -0
  36. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/arm64-windows-llvm.cmake +0 -0
  37. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/build-info.cmake +0 -0
  38. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/common.cmake +0 -0
  39. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/download-models.cmake +0 -0
  40. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/git-vars.cmake +0 -0
  41. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/license.cmake +0 -0
  42. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/llama-config.cmake.in +0 -0
  43. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/llama.pc.in +0 -0
  44. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/riscv64-spacemit-linux-gnu-gcc.cmake +0 -0
  45. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/cmake/x64-windows-llvm.cmake +0 -0
  46. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/CMakeLists.txt +0 -0
  47. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/arg.cpp +0 -0
  48. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/arg.h +0 -0
  49. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/base64.hpp +0 -0
  50. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-auto-parser-generator.cpp +0 -0
  51. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-auto-parser-helpers.cpp +0 -0
  52. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-auto-parser-helpers.h +0 -0
  53. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-auto-parser.h +0 -0
  54. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-diff-analyzer.cpp +0 -0
  55. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-peg-parser.cpp +0 -0
  56. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat-peg-parser.h +0 -0
  57. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat.cpp +0 -0
  58. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/chat.h +0 -0
  59. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/common.cpp +0 -0
  60. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/common.h +0 -0
  61. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/console.cpp +0 -0
  62. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/console.h +0 -0
  63. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/debug.cpp +0 -0
  64. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/debug.h +0 -0
  65. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/download.cpp +0 -0
  66. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/download.h +0 -0
  67. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/hf-cache.cpp +0 -0
  68. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/hf-cache.h +0 -0
  69. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/http.h +0 -0
  70. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/caps.cpp +0 -0
  71. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/caps.h +0 -0
  72. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/lexer.cpp +0 -0
  73. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/lexer.h +0 -0
  74. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/parser.cpp +0 -0
  75. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/parser.h +0 -0
  76. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/runtime.cpp +0 -0
  77. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/runtime.h +0 -0
  78. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/string.cpp +0 -0
  79. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/string.h +0 -0
  80. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/utils.h +0 -0
  81. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/value.cpp +0 -0
  82. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/jinja/value.h +0 -0
  83. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/json-partial.cpp +0 -0
  84. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/json-partial.h +0 -0
  85. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/json-schema-to-grammar.cpp +0 -0
  86. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/json-schema-to-grammar.h +0 -0
  87. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/llguidance.cpp +0 -0
  88. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/log.cpp +0 -0
  89. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/log.h +0 -0
  90. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-cache.cpp +0 -0
  91. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-cache.h +0 -0
  92. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-map.cpp +0 -0
  93. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-map.h +0 -0
  94. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-mod.cpp +0 -0
  95. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/ngram-mod.h +0 -0
  96. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/peg-parser.cpp +0 -0
  97. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/peg-parser.h +0 -0
  98. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/preset.cpp +0 -0
  99. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/preset.h +0 -0
  100. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/reasoning-budget.cpp +0 -0
  101. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/reasoning-budget.h +0 -0
  102. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/regex-partial.cpp +0 -0
  103. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/regex-partial.h +0 -0
  104. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/sampling.cpp +0 -0
  105. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/sampling.h +0 -0
  106. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/speculative.cpp +0 -0
  107. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/speculative.h +0 -0
  108. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/unicode.cpp +0 -0
  109. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/common/unicode.h +0 -0
  110. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-alloc.h +0 -0
  111. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-backend.h +0 -0
  112. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-blas.h +0 -0
  113. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-cann.h +0 -0
  114. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-cpp.h +0 -0
  115. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-cpu.h +0 -0
  116. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-cuda.h +0 -0
  117. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-hexagon.h +0 -0
  118. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-metal.h +0 -0
  119. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-opencl.h +0 -0
  120. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-openvino.h +0 -0
  121. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-opt.h +0 -0
  122. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-rpc.h +0 -0
  123. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-sycl.h +0 -0
  124. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-virtgpu.h +0 -0
  125. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-vulkan.h +0 -0
  126. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-webgpu.h +0 -0
  127. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-zdnn.h +0 -0
  128. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml-zendnn.h +0 -0
  129. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/ggml.h +0 -0
  130. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/include/gguf.h +0 -0
  131. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/CMakeLists.txt +0 -0
  132. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-alloc.c +0 -0
  133. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend-dl.cpp +0 -0
  134. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend-dl.h +0 -0
  135. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend-impl.h +0 -0
  136. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend-reg.cpp +0 -0
  137. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-backend.cpp +0 -0
  138. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-blas/CMakeLists.txt +0 -0
  139. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-blas/ggml-blas.cpp +0 -0
  140. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/CMakeLists.txt +0 -0
  141. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/acl_tensor.cpp +0 -0
  142. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/acl_tensor.h +0 -0
  143. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/aclnn_ops.cpp +0 -0
  144. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/aclnn_ops.h +0 -0
  145. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/common.h +0 -0
  146. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cann/ggml-cann.cpp +0 -0
  147. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-common.h +0 -0
  148. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/CMakeLists.txt +0 -0
  149. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/amx.cpp +0 -0
  150. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/amx.h +0 -0
  151. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/common.h +0 -0
  152. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/mmq.cpp +0 -0
  153. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/amx/mmq.h +0 -0
  154. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/arm/cpu-feats.cpp +0 -0
  155. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/arm/quants.c +0 -0
  156. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/arm/repack.cpp +0 -0
  157. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/loongarch/quants.c +0 -0
  158. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/powerpc/cpu-feats.cpp +0 -0
  159. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/powerpc/quants.c +0 -0
  160. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/riscv/cpu-feats.cpp +0 -0
  161. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/riscv/quants.c +0 -0
  162. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/riscv/repack.cpp +0 -0
  163. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/s390/cpu-feats.cpp +0 -0
  164. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/s390/quants.c +0 -0
  165. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/wasm/quants.c +0 -0
  166. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/x86/cpu-feats.cpp +0 -0
  167. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/x86/quants.c +0 -0
  168. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch/x86/repack.cpp +0 -0
  169. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/arch-fallback.h +0 -0
  170. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/binary-ops.cpp +0 -0
  171. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/binary-ops.h +0 -0
  172. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/cmake/FindSIMD.cmake +0 -0
  173. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/common.h +0 -0
  174. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ggml-cpu-impl.h +0 -0
  175. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ggml-cpu.c +0 -0
  176. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ggml-cpu.cpp +0 -0
  177. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/hbm.cpp +0 -0
  178. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/hbm.h +0 -0
  179. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kernels.cpp +0 -0
  180. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kernels.h +0 -0
  181. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kleidiai.cpp +0 -0
  182. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/kleidiai/kleidiai.h +0 -0
  183. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/llamafile/sgemm.cpp +0 -0
  184. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/llamafile/sgemm.h +0 -0
  185. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ops.cpp +0 -0
  186. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/ops.h +0 -0
  187. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/quants.c +0 -0
  188. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/quants.h +0 -0
  189. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/repack.cpp +0 -0
  190. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/repack.h +0 -0
  191. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/simd-gemm.h +0 -0
  192. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/simd-mappings.h +0 -0
  193. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime.cpp +0 -0
  194. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime.h +0 -0
  195. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime1_kernels.cpp +0 -0
  196. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/spacemit/ime_kernels.h +0 -0
  197. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/traits.cpp +0 -0
  198. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/traits.h +0 -0
  199. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/unary-ops.cpp +0 -0
  200. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/unary-ops.h +0 -0
  201. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/vec.cpp +0 -0
  202. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cpu/vec.h +0 -0
  203. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cuda/CMakeLists.txt +0 -0
  204. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cuda/vendors/cuda.h +0 -0
  205. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cuda/vendors/hip.h +0 -0
  206. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-cuda/vendors/musa.h +0 -0
  207. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/CMakeLists.txt +0 -0
  208. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/ggml-hexagon.cpp +0 -0
  209. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/CMakeLists.txt +0 -0
  210. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/act-ops.c +0 -0
  211. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/argsort-ops.c +0 -0
  212. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/binary-ops.c +0 -0
  213. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/cmake-toolchain.cmake +0 -0
  214. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/cpy-ops.c +0 -0
  215. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/cumsum-ops.c +0 -0
  216. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/flash-attn-ops.c +0 -0
  217. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/get-rows-ops.c +0 -0
  218. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-dma.c +0 -0
  219. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-dma.h +0 -0
  220. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-dump.h +0 -0
  221. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-fastdiv.h +0 -0
  222. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hex-utils.h +0 -0
  223. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-matmul-ops.c +0 -0
  224. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-ops.h +0 -0
  225. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-profile.h +0 -0
  226. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hmx-utils.h +0 -0
  227. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/htp-ctx.h +0 -0
  228. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/htp-msg.h +0 -0
  229. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/htp-ops.h +0 -0
  230. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-arith.h +0 -0
  231. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-base.h +0 -0
  232. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-copy.h +0 -0
  233. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-div.h +0 -0
  234. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-dump.h +0 -0
  235. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-exp.h +0 -0
  236. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-floor.h +0 -0
  237. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-inverse.h +0 -0
  238. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-reduce.h +0 -0
  239. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-scale.h +0 -0
  240. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-sigmoid.h +0 -0
  241. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-sqrt.h +0 -0
  242. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-types.h +0 -0
  243. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/hvx-utils.h +0 -0
  244. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/main.c +0 -0
  245. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/matmul-ops.c +0 -0
  246. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/repeat-ops.c +0 -0
  247. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/rope-ops.c +0 -0
  248. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/set-rows-ops.c +0 -0
  249. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/softmax-ops.c +0 -0
  250. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/ssm-conv.c +0 -0
  251. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/sum-rows-ops.c +0 -0
  252. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/unary-ops.c +0 -0
  253. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/worker-pool.c +0 -0
  254. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp/worker-pool.h +0 -0
  255. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp-drv.cpp +0 -0
  256. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/htp-drv.h +0 -0
  257. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/libdl.h +0 -0
  258. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hexagon/op-desc.h +0 -0
  259. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-hip/CMakeLists.txt +0 -0
  260. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-impl.h +0 -0
  261. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/CMakeLists.txt +0 -0
  262. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-common.cpp +0 -0
  263. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-common.h +0 -0
  264. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-context.h +0 -0
  265. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-context.m +0 -0
  266. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-device.cpp +0 -0
  267. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-device.h +0 -0
  268. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-device.m +0 -0
  269. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-impl.h +0 -0
  270. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-ops.cpp +0 -0
  271. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal-ops.h +0 -0
  272. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal.cpp +0 -0
  273. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/ggml-metal.metal +0 -0
  274. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/turbo-matrices.h +0 -0
  275. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-metal/turbo-wht.h +0 -0
  276. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-musa/CMakeLists.txt +0 -0
  277. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-opencl/CMakeLists.txt +0 -0
  278. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-opencl/ggml-opencl.cpp +0 -0
  279. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/CMakeLists.txt +0 -0
  280. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-decoder.cpp +0 -0
  281. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-decoder.h +0 -0
  282. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-openvino-extra.cpp +0 -0
  283. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-openvino-extra.h +0 -0
  284. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-openvino.cpp +0 -0
  285. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-quants.cpp +0 -0
  286. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/ggml-quants.h +0 -0
  287. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/decoder.h +0 -0
  288. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/frontend.cpp +0 -0
  289. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/frontend.h +0 -0
  290. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/input_model.cpp +0 -0
  291. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/input_model.h +0 -0
  292. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/node_context.h +0 -0
  293. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/cont.cpp +0 -0
  294. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/cpy.cpp +0 -0
  295. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/flash_attn_ext.cpp +0 -0
  296. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/get_rows.cpp +0 -0
  297. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/glu_geglu.cpp +0 -0
  298. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/glu_swiglu.cpp +0 -0
  299. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/mulmat.cpp +0 -0
  300. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/permute.cpp +0 -0
  301. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/reshape.cpp +0 -0
  302. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/rms_norm.cpp +0 -0
  303. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/rope.cpp +0 -0
  304. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/scale.cpp +0 -0
  305. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/set_rows.cpp +0 -0
  306. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/softmax.cpp +0 -0
  307. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/transpose.cpp +0 -0
  308. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/unary_silu.cpp +0 -0
  309. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op/view.cpp +0 -0
  310. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op_table.cpp +0 -0
  311. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/op_table.h +0 -0
  312. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/eliminate_zp.cpp +0 -0
  313. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/eliminate_zp.h +0 -0
  314. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/fuse_to_sdpa.cpp +0 -0
  315. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/fuse_to_sdpa.h +0 -0
  316. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/mark_decompression_convert_constant_folding.h +0 -0
  317. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/squeeze_matmul.cpp +0 -0
  318. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/pass/squeeze_matmul.h +0 -0
  319. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/translate_session.cpp +0 -0
  320. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/translate_session.h +0 -0
  321. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/utils.cpp +0 -0
  322. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/openvino/utils.h +0 -0
  323. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/utils.cpp +0 -0
  324. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-openvino/utils.h +0 -0
  325. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-opt.cpp +0 -0
  326. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-quants.c +0 -0
  327. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-quants.h +0 -0
  328. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-rpc/CMakeLists.txt +0 -0
  329. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-rpc/ggml-rpc.cpp +0 -0
  330. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/CMakeLists.txt +0 -0
  331. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/add-id.cpp +0 -0
  332. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/add-id.hpp +0 -0
  333. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/backend.hpp +0 -0
  334. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/binbcast.cpp +0 -0
  335. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/binbcast.hpp +0 -0
  336. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/common.cpp +0 -0
  337. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/common.hpp +0 -0
  338. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/concat.cpp +0 -0
  339. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/concat.hpp +0 -0
  340. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/conv.cpp +0 -0
  341. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/conv.hpp +0 -0
  342. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/convert.cpp +0 -0
  343. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/convert.hpp +0 -0
  344. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/count-equal.cpp +0 -0
  345. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/count-equal.hpp +0 -0
  346. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/cpy.cpp +0 -0
  347. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/cpy.hpp +0 -0
  348. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/dequantize.hpp +0 -0
  349. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/dmmv.cpp +0 -0
  350. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/dmmv.hpp +0 -0
  351. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/dpct/helper.hpp +0 -0
  352. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/element_wise.cpp +0 -0
  353. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/element_wise.hpp +0 -0
  354. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-common.hpp +0 -0
  355. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-tile.cpp +0 -0
  356. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-tile.hpp +0 -0
  357. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn-vec.hpp +0 -0
  358. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn.cpp +0 -0
  359. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/fattn.hpp +0 -0
  360. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gated_delta_net.cpp +0 -0
  361. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gated_delta_net.hpp +0 -0
  362. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gemm.hpp +0 -0
  363. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/getrows.cpp +0 -0
  364. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/getrows.hpp +0 -0
  365. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/ggml-sycl.cpp +0 -0
  366. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gla.cpp +0 -0
  367. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/gla.hpp +0 -0
  368. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/im2col.cpp +0 -0
  369. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/im2col.hpp +0 -0
  370. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/mmq.cpp +0 -0
  371. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/mmq.hpp +0 -0
  372. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/mmvq.cpp +0 -0
  373. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/mmvq.hpp +0 -0
  374. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/norm.cpp +0 -0
  375. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/norm.hpp +0 -0
  376. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/outprod.cpp +0 -0
  377. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/outprod.hpp +0 -0
  378. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/pad.cpp +0 -0
  379. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/pad.hpp +0 -0
  380. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/pad_reflect_1d.cpp +0 -0
  381. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/pad_reflect_1d.hpp +0 -0
  382. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/presets.hpp +0 -0
  383. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/quantize.hpp +0 -0
  384. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/quants.hpp +0 -0
  385. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/repeat_back.cpp +0 -0
  386. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/repeat_back.hpp +0 -0
  387. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/roll.cpp +0 -0
  388. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/roll.hpp +0 -0
  389. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/rope.cpp +0 -0
  390. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/rope.hpp +0 -0
  391. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/set.cpp +0 -0
  392. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/set.hpp +0 -0
  393. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/set_rows.cpp +0 -0
  394. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/set_rows.hpp +0 -0
  395. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/softmax.cpp +0 -0
  396. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/softmax.hpp +0 -0
  397. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/ssm_conv.cpp +0 -0
  398. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/ssm_conv.hpp +0 -0
  399. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/sycl_hw.cpp +0 -0
  400. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/sycl_hw.hpp +0 -0
  401. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq112-dv112.cpp +0 -0
  402. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq128-dv128.cpp +0 -0
  403. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq256-dv256.cpp +0 -0
  404. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq40-dv40.cpp +0 -0
  405. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq576-dv512.cpp +0 -0
  406. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq64-dv64.cpp +0 -0
  407. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq72-dv72.cpp +0 -0
  408. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq80-dv80.cpp +0 -0
  409. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-tile-instance-dkq96-dv96.cpp +0 -0
  410. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-f16.cpp +0 -0
  411. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q4_0.cpp +0 -0
  412. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q4_1.cpp +0 -0
  413. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q5_0.cpp +0 -0
  414. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q5_1.cpp +0 -0
  415. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-f16-q8_0.cpp +0 -0
  416. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-f16.cpp +0 -0
  417. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q4_0.cpp +0 -0
  418. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q4_1.cpp +0 -0
  419. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q5_0.cpp +0 -0
  420. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q5_1.cpp +0 -0
  421. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_0-q8_0.cpp +0 -0
  422. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-f16.cpp +0 -0
  423. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q4_0.cpp +0 -0
  424. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q4_1.cpp +0 -0
  425. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q5_0.cpp +0 -0
  426. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q5_1.cpp +0 -0
  427. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q4_1-q8_0.cpp +0 -0
  428. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-f16.cpp +0 -0
  429. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q4_0.cpp +0 -0
  430. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q4_1.cpp +0 -0
  431. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q5_0.cpp +0 -0
  432. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q5_1.cpp +0 -0
  433. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_0-q8_0.cpp +0 -0
  434. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-f16.cpp +0 -0
  435. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q4_0.cpp +0 -0
  436. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q4_1.cpp +0 -0
  437. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q5_0.cpp +0 -0
  438. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q5_1.cpp +0 -0
  439. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q5_1-q8_0.cpp +0 -0
  440. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-f16.cpp +0 -0
  441. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q4_0.cpp +0 -0
  442. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q4_1.cpp +0 -0
  443. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q5_0.cpp +0 -0
  444. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q5_1.cpp +0 -0
  445. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/template-instances/fattn-vec-instance-q8_0-q8_0.cpp +0 -0
  446. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/tsembd.cpp +0 -0
  447. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/tsembd.hpp +0 -0
  448. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/type.hpp +0 -0
  449. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/upscale.cpp +0 -0
  450. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/upscale.hpp +0 -0
  451. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/vecdotq.hpp +0 -0
  452. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/wkv.cpp +0 -0
  453. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-sycl/wkv.hpp +0 -0
  454. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-threading.cpp +0 -0
  455. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-threading.h +0 -0
  456. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-turbo-quant.c +0 -0
  457. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/CMakeLists.txt +0 -0
  458. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/apir_cs_ggml-rpc-front.cpp +0 -0
  459. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/CMakeLists.txt +0 -0
  460. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/apir_cs_ggml-rpc-back.cpp +0 -0
  461. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-convert.h +0 -0
  462. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-backend.cpp +0 -0
  463. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-buffer-type.cpp +0 -0
  464. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-buffer.cpp +0 -0
  465. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched-device.cpp +0 -0
  466. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched.cpp +0 -0
  467. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched.gen.h +0 -0
  468. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-dispatched.h +0 -0
  469. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend-virgl-apir.h +0 -0
  470. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/backend.cpp +0 -0
  471. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/api_remoting.h +0 -0
  472. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_backend.gen.h +0 -0
  473. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_backend.h +0 -0
  474. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_cs.h +0 -0
  475. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_cs_ggml.h +0 -0
  476. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/backend/shared/apir_cs_rpc.h +0 -0
  477. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-buffer-type.cpp +0 -0
  478. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-buffer.cpp +0 -0
  479. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-device.cpp +0 -0
  480. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend-reg.cpp +0 -0
  481. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-backend.cpp +0 -0
  482. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/ggml-remoting.h +0 -0
  483. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/include/apir_hw.h +0 -0
  484. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-apir.h +0 -0
  485. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-backend.cpp +0 -0
  486. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-buffer-type.cpp +0 -0
  487. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-buffer.cpp +0 -0
  488. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-device.cpp +0 -0
  489. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward-impl.h +0 -0
  490. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-forward.gen.h +0 -0
  491. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-shm.cpp +0 -0
  492. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-shm.h +0 -0
  493. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-utils.cpp +0 -0
  494. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu-utils.h +0 -0
  495. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu.cpp +0 -0
  496. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-virtgpu/virtgpu.h +0 -0
  497. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-vulkan/CMakeLists.txt +0 -0
  498. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-vulkan/ggml-vulkan.cpp +0 -0
  499. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-vulkan/vulkan-shaders/CMakeLists.txt +0 -0
  500. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp +0 -0
  501. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-webgpu/CMakeLists.txt +0 -0
  502. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-webgpu/ggml-webgpu-shader-lib.hpp +0 -0
  503. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-webgpu/ggml-webgpu.cpp +0 -0
  504. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-webgpu/pre_wgsl.hpp +0 -0
  505. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/CMakeLists.txt +0 -0
  506. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/common.hpp +0 -0
  507. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/ggml-zdnn.cpp +0 -0
  508. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/mmf.cpp +0 -0
  509. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/mmf.hpp +0 -0
  510. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/utils.cpp +0 -0
  511. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zdnn/utils.hpp +0 -0
  512. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zendnn/CMakeLists.txt +0 -0
  513. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml-zendnn/ggml-zendnn.cpp +0 -0
  514. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml.c +0 -0
  515. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/ggml.cpp +0 -0
  516. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/ggml/src/gguf.cpp +0 -0
  517. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/include/llama-cpp.h +0 -0
  518. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/include/llama.h +0 -0
  519. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/licenses/LICENSE-jsonhpp +0 -0
  520. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/CMakeLists.txt +0 -0
  521. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-adapter.cpp +0 -0
  522. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-adapter.h +0 -0
  523. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-arch.cpp +0 -0
  524. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-arch.h +0 -0
  525. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-batch.cpp +0 -0
  526. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-batch.h +0 -0
  527. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-chat.cpp +0 -0
  528. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-chat.h +0 -0
  529. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-context.cpp +0 -0
  530. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-context.h +0 -0
  531. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-cparams.cpp +0 -0
  532. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-cparams.h +0 -0
  533. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-ext.h +0 -0
  534. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-grammar.cpp +0 -0
  535. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-grammar.h +0 -0
  536. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-graph.cpp +0 -0
  537. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-graph.h +0 -0
  538. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-hparams.cpp +0 -0
  539. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-hparams.h +0 -0
  540. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-impl.cpp +0 -0
  541. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-impl.h +0 -0
  542. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-io.cpp +0 -0
  543. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-io.h +0 -0
  544. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cache-iswa.cpp +0 -0
  545. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cache-iswa.h +0 -0
  546. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cache.cpp +0 -0
  547. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cache.h +0 -0
  548. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-kv-cells.h +0 -0
  549. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-hybrid-iswa.cpp +0 -0
  550. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-hybrid-iswa.h +0 -0
  551. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-hybrid.cpp +0 -0
  552. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-hybrid.h +0 -0
  553. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-recurrent.cpp +0 -0
  554. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory-recurrent.h +0 -0
  555. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory.cpp +0 -0
  556. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-memory.h +0 -0
  557. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-mmap.cpp +0 -0
  558. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-mmap.h +0 -0
  559. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model-loader.cpp +0 -0
  560. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model-loader.h +0 -0
  561. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model-saver.cpp +0 -0
  562. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model-saver.h +0 -0
  563. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model.cpp +0 -0
  564. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-model.h +0 -0
  565. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-quant.cpp +0 -0
  566. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-quant.h +0 -0
  567. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-sampler.cpp +0 -0
  568. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-sampler.h +0 -0
  569. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-vocab.cpp +0 -0
  570. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama-vocab.h +0 -0
  571. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/llama.cpp +0 -0
  572. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/afmoe.cpp +0 -0
  573. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/apertus.cpp +0 -0
  574. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/arcee.cpp +0 -0
  575. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/arctic.cpp +0 -0
  576. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/arwkv7.cpp +0 -0
  577. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/baichuan.cpp +0 -0
  578. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bailingmoe.cpp +0 -0
  579. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bailingmoe2.cpp +0 -0
  580. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bert.cpp +0 -0
  581. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bitnet.cpp +0 -0
  582. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/bloom.cpp +0 -0
  583. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/chameleon.cpp +0 -0
  584. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/chatglm.cpp +0 -0
  585. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/codeshell.cpp +0 -0
  586. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/cogvlm.cpp +0 -0
  587. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/cohere2-iswa.cpp +0 -0
  588. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/command-r.cpp +0 -0
  589. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/dbrx.cpp +0 -0
  590. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/deci.cpp +0 -0
  591. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/deepseek.cpp +0 -0
  592. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/deepseek2.cpp +0 -0
  593. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/delta-net-base.cpp +0 -0
  594. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/dots1.cpp +0 -0
  595. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/dream.cpp +0 -0
  596. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/ernie4-5-moe.cpp +0 -0
  597. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/ernie4-5.cpp +0 -0
  598. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/eurobert.cpp +0 -0
  599. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/exaone-moe.cpp +0 -0
  600. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/exaone.cpp +0 -0
  601. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/exaone4.cpp +0 -0
  602. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/falcon-h1.cpp +0 -0
  603. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/falcon.cpp +0 -0
  604. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma-embedding.cpp +0 -0
  605. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma.cpp +0 -0
  606. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma2-iswa.cpp +0 -0
  607. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma3.cpp +0 -0
  608. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma3n-iswa.cpp +0 -0
  609. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gemma4-iswa.cpp +0 -0
  610. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/glm4-moe.cpp +0 -0
  611. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/glm4.cpp +0 -0
  612. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gpt2.cpp +0 -0
  613. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/gptneox.cpp +0 -0
  614. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/granite-hybrid.cpp +0 -0
  615. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/granite.cpp +0 -0
  616. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/grok.cpp +0 -0
  617. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/grovemoe.cpp +0 -0
  618. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/hunyuan-dense.cpp +0 -0
  619. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/hunyuan-moe.cpp +0 -0
  620. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/internlm2.cpp +0 -0
  621. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/jais.cpp +0 -0
  622. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/jais2.cpp +0 -0
  623. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/jamba.cpp +0 -0
  624. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/kimi-linear.cpp +0 -0
  625. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/lfm2.cpp +0 -0
  626. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/llada-moe.cpp +0 -0
  627. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/llada.cpp +0 -0
  628. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/llama-iswa.cpp +0 -0
  629. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/llama.cpp +0 -0
  630. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/maincoder.cpp +0 -0
  631. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mamba-base.cpp +0 -0
  632. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mamba.cpp +0 -0
  633. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mimo2-iswa.cpp +0 -0
  634. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/minicpm3.cpp +0 -0
  635. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/minimax-m2.cpp +0 -0
  636. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mistral3.cpp +0 -0
  637. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/models.h +0 -0
  638. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/modern-bert.cpp +0 -0
  639. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/mpt.cpp +0 -0
  640. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/nemotron-h.cpp +0 -0
  641. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/nemotron.cpp +0 -0
  642. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/neo-bert.cpp +0 -0
  643. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/olmo.cpp +0 -0
  644. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/olmo2.cpp +0 -0
  645. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/olmoe.cpp +0 -0
  646. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/openai-moe-iswa.cpp +0 -0
  647. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/openelm.cpp +0 -0
  648. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/orion.cpp +0 -0
  649. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/paddleocr.cpp +0 -0
  650. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/pangu-embedded.cpp +0 -0
  651. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/phi2.cpp +0 -0
  652. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/phi3.cpp +0 -0
  653. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/plamo.cpp +0 -0
  654. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/plamo2.cpp +0 -0
  655. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/plamo3.cpp +0 -0
  656. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/plm.cpp +0 -0
  657. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen.cpp +0 -0
  658. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen2.cpp +0 -0
  659. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen2moe.cpp +0 -0
  660. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen2vl.cpp +0 -0
  661. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3.cpp +0 -0
  662. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen35.cpp +0 -0
  663. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen35moe.cpp +0 -0
  664. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3moe.cpp +0 -0
  665. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3next.cpp +0 -0
  666. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3vl-moe.cpp +0 -0
  667. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/qwen3vl.cpp +0 -0
  668. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/refact.cpp +0 -0
  669. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rnd1.cpp +0 -0
  670. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv6-base.cpp +0 -0
  671. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv6.cpp +0 -0
  672. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv6qwen2.cpp +0 -0
  673. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv7-base.cpp +0 -0
  674. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/rwkv7.cpp +0 -0
  675. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/seed-oss.cpp +0 -0
  676. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/smallthinker.cpp +0 -0
  677. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/smollm3.cpp +0 -0
  678. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/stablelm.cpp +0 -0
  679. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/starcoder.cpp +0 -0
  680. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/starcoder2.cpp +0 -0
  681. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/step35-iswa.cpp +0 -0
  682. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/t5-dec.cpp +0 -0
  683. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/t5-enc.cpp +0 -0
  684. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/wavtokenizer-dec.cpp +0 -0
  685. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/models/xverse.cpp +0 -0
  686. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/turbo-rotation-data-32.h +0 -0
  687. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/turbo-rotation-data.h +0 -0
  688. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/unicode-data.cpp +0 -0
  689. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/unicode-data.h +0 -0
  690. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/unicode.cpp +0 -0
  691. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/src/unicode.h +0 -0
  692. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/CMakeLists.txt +0 -0
  693. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/batched-bench/CMakeLists.txt +0 -0
  694. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/batched-bench/batched-bench.cpp +0 -0
  695. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cli/CMakeLists.txt +0 -0
  696. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cli/cli.cpp +0 -0
  697. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/completion/CMakeLists.txt +0 -0
  698. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/completion/completion.cpp +0 -0
  699. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cvector-generator/CMakeLists.txt +0 -0
  700. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cvector-generator/cvector-generator.cpp +0 -0
  701. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cvector-generator/mean.hpp +0 -0
  702. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/cvector-generator/pca.hpp +0 -0
  703. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/export-lora/CMakeLists.txt +0 -0
  704. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/export-lora/export-lora.cpp +0 -0
  705. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/fit-params/CMakeLists.txt +0 -0
  706. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/fit-params/fit-params.cpp +0 -0
  707. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/gguf-split/CMakeLists.txt +0 -0
  708. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/gguf-split/gguf-split.cpp +0 -0
  709. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/imatrix/CMakeLists.txt +0 -0
  710. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/imatrix/imatrix.cpp +0 -0
  711. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/llama-bench/CMakeLists.txt +0 -0
  712. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/llama-bench/llama-bench.cpp +0 -0
  713. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/CMakeLists.txt +0 -0
  714. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip-graph.h +0 -0
  715. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip-impl.h +0 -0
  716. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip-model.h +0 -0
  717. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip.cpp +0 -0
  718. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/clip.h +0 -0
  719. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/debug/mtmd-debug.cpp +0 -0
  720. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/debug/mtmd-debug.h +0 -0
  721. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/deprecation-warning.cpp +0 -0
  722. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/cogvlm.cpp +0 -0
  723. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/conformer.cpp +0 -0
  724. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/deepseekocr.cpp +0 -0
  725. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/gemma4v.cpp +0 -0
  726. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/glm4v.cpp +0 -0
  727. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/hunyuanocr.cpp +0 -0
  728. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/internvl.cpp +0 -0
  729. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/kimik25.cpp +0 -0
  730. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/kimivl.cpp +0 -0
  731. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/llama4.cpp +0 -0
  732. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/llava.cpp +0 -0
  733. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/minicpmv.cpp +0 -0
  734. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/mobilenetv5.cpp +0 -0
  735. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/models.h +0 -0
  736. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/nemotron-v2-vl.cpp +0 -0
  737. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/paddleocr.cpp +0 -0
  738. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/pixtral.cpp +0 -0
  739. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/qwen2vl.cpp +0 -0
  740. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/qwen3vl.cpp +0 -0
  741. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/siglip.cpp +0 -0
  742. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/whisper-enc.cpp +0 -0
  743. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/models/youtuvl.cpp +0 -0
  744. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-audio.cpp +0 -0
  745. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-audio.h +0 -0
  746. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-cli.cpp +0 -0
  747. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-helper.cpp +0 -0
  748. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-helper.h +0 -0
  749. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-image.cpp +0 -0
  750. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd-image.h +0 -0
  751. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd.cpp +0 -0
  752. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/mtmd/mtmd.h +0 -0
  753. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/parser/CMakeLists.txt +0 -0
  754. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/parser/debug-template-parser.cpp +0 -0
  755. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/parser/template-analysis.cpp +0 -0
  756. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/perplexity/CMakeLists.txt +0 -0
  757. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/perplexity/perplexity.cpp +0 -0
  758. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/quantize/CMakeLists.txt +0 -0
  759. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/quantize/quantize.cpp +0 -0
  760. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/results/CMakeLists.txt +0 -0
  761. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/results/results.cpp +0 -0
  762. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/rpc/CMakeLists.txt +0 -0
  763. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/rpc/rpc-server.cpp +0 -0
  764. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/CMakeLists.txt +0 -0
  765. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-common.cpp +0 -0
  766. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-common.h +0 -0
  767. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-context.cpp +0 -0
  768. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-context.h +0 -0
  769. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-cors-proxy.h +0 -0
  770. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-http.cpp +0 -0
  771. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-http.h +0 -0
  772. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-models.cpp +0 -0
  773. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-models.h +0 -0
  774. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-queue.cpp +0 -0
  775. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-queue.h +0 -0
  776. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-task.cpp +0 -0
  777. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-task.h +0 -0
  778. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-tools.cpp +0 -0
  779. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server-tools.h +0 -0
  780. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/server/server.cpp +0 -0
  781. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/tokenize/CMakeLists.txt +0 -0
  782. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/tokenize/tokenize.cpp +0 -0
  783. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/tts/CMakeLists.txt +0 -0
  784. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/tools/tts/tts.cpp +0 -0
  785. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/cpp-httplib/CMakeLists.txt +0 -0
  786. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/cpp-httplib/httplib.cpp +0 -0
  787. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/cpp-httplib/httplib.h +0 -0
  788. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/miniaudio/miniaudio.h +0 -0
  789. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/nlohmann/json.hpp +0 -0
  790. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/nlohmann/json_fwd.hpp +0 -0
  791. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/sheredom/subprocess.h +0 -0
  792. {localcode-0.2.15 → localcode-0.2.16}/llama-cpp-turboquant/vendor/stb/stb_image.h +0 -0
  793. {localcode-0.2.15 → localcode-0.2.16}/setup.cfg +0 -0
  794. {localcode-0.2.15 → localcode-0.2.16}/setup.py +0 -0
  795. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/__main__.py +0 -0
  796. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/_subproc_env.py +0 -0
  797. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/app_tasks.py +0 -0
  798. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/constants.py +0 -0
  799. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/context.py +0 -0
  800. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/goal.py +0 -0
  801. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/hooks.py +0 -0
  802. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/loop.py +0 -0
  803. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/prompt_context.py +0 -0
  804. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/prompts.py +0 -0
  805. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/recovery.py +0 -0
  806. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/streaming.py +0 -0
  807. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/tool_execution.py +0 -0
  808. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/tool_orchestration.py +0 -0
  809. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/agent/turn_finalization.py +0 -0
  810. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/approvals.py +0 -0
  811. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/auto_compact.py +0 -0
  812. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/bin/__init__.py +0 -0
  813. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/bin/llama-server +0 -0
  814. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/cache.py +0 -0
  815. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/checkpoint.py +0 -0
  816. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/compact.py +0 -0
  817. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/compaction.py +0 -0
  818. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/composer.py +0 -0
  819. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/config.py +0 -0
  820. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/context.py +0 -0
  821. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/display.py +0 -0
  822. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/embeddings.py +0 -0
  823. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/entrypoint.py +0 -0
  824. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/errors.py +0 -0
  825. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/events.py +0 -0
  826. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/features.py +0 -0
  827. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/headless_json.py +0 -0
  828. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/health.py +0 -0
  829. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/hf_quants.py +0 -0
  830. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/history.py +0 -0
  831. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/hooks.py +0 -0
  832. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/indexer.py +0 -0
  833. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/injection_defense.py +0 -0
  834. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/launcher.py +0 -0
  835. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/logging_utils.py +0 -0
  836. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/lsp.py +0 -0
  837. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/mcp.py +0 -0
  838. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/memory_guard.py +0 -0
  839. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/model_config.py +0 -0
  840. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/models.py +0 -0
  841. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/notebook.py +0 -0
  842. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/output.py +0 -0
  843. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/paths.py +0 -0
  844. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/performance.py +0 -0
  845. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/permissions.py +0 -0
  846. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/permissions_v2.py +0 -0
  847. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/recovery.py +0 -0
  848. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/runtime_diffusion.py +0 -0
  849. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/server_manager.py +0 -0
  850. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/session.py +0 -0
  851. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/shell.py +0 -0
  852. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/debug.md +0 -0
  853. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/edit-verified.md +0 -0
  854. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/explain.md +0 -0
  855. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/git-commit-safely.md +0 -0
  856. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/locate.md +0 -0
  857. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/plan-task.md +0 -0
  858. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/review.md +0 -0
  859. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills/run-tests.md +0 -0
  860. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/skills.py +0 -0
  861. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/sounds.py +0 -0
  862. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/thermal.py +0 -0
  863. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/thinking.py +0 -0
  864. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/toolkit.py +0 -0
  865. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/__init__.py +0 -0
  866. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/agent.py +0 -0
  867. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/append_file.py +0 -0
  868. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/base.py +0 -0
  869. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/bash.py +0 -0
  870. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/edit_diff.py +0 -0
  871. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/edit_file.py +0 -0
  872. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/facts.py +0 -0
  873. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/glob_tool.py +0 -0
  874. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/grep.py +0 -0
  875. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/launch_app.py +0 -0
  876. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/list_files.py +0 -0
  877. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/multi_edit.py +0 -0
  878. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/plan_mode.py +0 -0
  879. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/read_file.py +0 -0
  880. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/skill_tool.py +0 -0
  881. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/web_fetch.py +0 -0
  882. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/web_search.py +0 -0
  883. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tools/write_file.py +0 -0
  884. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/__init__.py +0 -0
  885. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/app.py +0 -0
  886. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/bridge.py +0 -0
  887. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/__init__.py +0 -0
  888. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/mode_picker.py +0 -0
  889. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/screens/model_picker.py +0 -0
  890. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/styles/__init__.py +0 -0
  891. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/styles/app.tcss +0 -0
  892. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/__init__.py +0 -0
  893. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/approval.py +0 -0
  894. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/chat_log.py +0 -0
  895. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/messages/__init__.py +0 -0
  896. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/messages/diff.py +0 -0
  897. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/tui/widgets/voice_visualizer.py +0 -0
  898. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/turn_diff.py +0 -0
  899. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/undo.py +0 -0
  900. {localcode-0.2.15 → localcode-0.2.16}/src/localcode/voice.py +0 -0
  901. {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/SOURCES.txt +0 -0
  902. {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/dependency_links.txt +0 -0
  903. {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/entry_points.txt +0 -0
  904. {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/requires.txt +0 -0
  905. {localcode-0.2.15 → localcode-0.2.16}/src/localcode.egg-info/top_level.txt +0 -0
  906. {localcode-0.2.15 → localcode-0.2.16}/tests/test_architecture.py +0 -0
  907. {localcode-0.2.15 → localcode-0.2.16}/tests/test_bootstrap.py +0 -0
  908. {localcode-0.2.15 → localcode-0.2.16}/tests/test_checkpoint.py +0 -0
  909. {localcode-0.2.15 → localcode-0.2.16}/tests/test_churn_detection.py +0 -0
  910. {localcode-0.2.15 → localcode-0.2.16}/tests/test_compaction.py +0 -0
  911. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_agent.py +0 -0
  912. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_bg_download.py +0 -0
  913. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_binary.py +0 -0
  914. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_cli.py +0 -0
  915. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_diffusion.py +0 -0
  916. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_download.py +0 -0
  917. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_hardening.py +0 -0
  918. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_install.py +0 -0
  919. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_machines.py +0 -0
  920. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_model_picker.py +0 -0
  921. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_models_matrix.py +0 -0
  922. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_tui.py +0 -0
  923. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_vision.py +0 -0
  924. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_voice.py +0 -0
  925. {localcode-0.2.15 → localcode-0.2.16}/tests/test_comprehensive_whisper.py +0 -0
  926. {localcode-0.2.15 → localcode-0.2.16}/tests/test_config.py +0 -0
  927. {localcode-0.2.15 → localcode-0.2.16}/tests/test_context.py +0 -0
  928. {localcode-0.2.15 → localcode-0.2.16}/tests/test_context_pipeline_e2e.py +0 -0
  929. {localcode-0.2.15 → localcode-0.2.16}/tests/test_download.py +0 -0
  930. {localcode-0.2.15 → localcode-0.2.16}/tests/test_embeddings_retrieval.py +0 -0
  931. {localcode-0.2.15 → localcode-0.2.16}/tests/test_fresh_install.py +0 -0
  932. {localcode-0.2.15 → localcode-0.2.16}/tests/test_kv_cap.py +0 -0
  933. {localcode-0.2.15 → localcode-0.2.16}/tests/test_model_config.py +0 -0
  934. {localcode-0.2.15 → localcode-0.2.16}/tests/test_models_catalog.py +0 -0
  935. {localcode-0.2.15 → localcode-0.2.16}/tests/test_output.py +0 -0
  936. {localcode-0.2.15 → localcode-0.2.16}/tests/test_prompt_language_steering.py +0 -0
  937. {localcode-0.2.15 → localcode-0.2.16}/tests/test_real_models.py +0 -0
  938. {localcode-0.2.15 → localcode-0.2.16}/tests/test_run_json.py +0 -0
  939. {localcode-0.2.15 → localcode-0.2.16}/tests/test_runtime.py +0 -0
  940. {localcode-0.2.15 → localcode-0.2.16}/tests/test_subproc_env.py +0 -0
  941. {localcode-0.2.15 → localcode-0.2.16}/tests/test_thermal.py +0 -0
  942. {localcode-0.2.15 → localcode-0.2.16}/tests/test_toolkit.py +0 -0
  943. {localcode-0.2.15 → localcode-0.2.16}/tests/test_tui_input.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: localcode
3
- Version: 0.2.15
3
+ Version: 0.2.16
4
4
  Summary: High-performance AI coding on consumer hardware.
5
5
  Author: LocalCode contributors
6
6
  License-Expression: Apache-2.0
@@ -54,7 +54,7 @@ Dynamic: license-file
54
54
  <p align="center">
55
55
  <img src="https://img.shields.io/pypi/v/localcode?style=flat-square&color=7c4dff" alt="PyPI">
56
56
  <img src="https://img.shields.io/badge/license-Apache_2.0-4caf50?style=flat-square" alt="License">
57
- <img src="https://img.shields.io/badge/python-3.11+-3776ab?style=flat-square" alt="Python">
57
+ <img src="https://img.shields.io/badge/python-3.9+-3776ab?style=flat-square" alt="Python">
58
58
  <img src="https://img.shields.io/badge/platform-Apple%20Silicon-999999?style=flat-square" alt="Platform">
59
59
  </p>
60
60
 
@@ -108,7 +108,7 @@ We are building for a world of truly democratized AI — where everyone has acce
108
108
 
109
109
  - **Mac with Apple Silicon**
110
110
  - **16 GB RAM** minimum
111
- - **Python 3.11+**
111
+ - **Python 3.9+**
112
112
  - **~12 GB free disk** (10 GB model + server)
113
113
 
114
114
  ### Tested hardware
@@ -122,18 +122,35 @@ LocalCode is early software. Hardware support is expected to broaden, but only t
122
122
  | M4 Apple Silicon | 24 GB+ | Not yet tested | Expected to support larger contexts, but needs validation |
123
123
  | Intel Mac | Any | Not supported | LocalCode targets Apple Silicon |
124
124
 
125
+ ## Models
126
+
127
+ On launch, LocalCode recommends the best model for **your Mac's RAM** — there's no fixed default. You can pick any of these (or a different quant) in the model picker.
128
+
129
+ | Model | Size (quant) | Active params | Min RAM | Architecture |
130
+ | --- | ---: | --- | ---: | --- |
131
+ | Gemma 4 12B | 7.4 GB (Q4) | 12B (dense) | 16 GB | gemma4-iswa |
132
+ | Gemma 4 26B-A4B | 11.2 GB (Q3) | 3.8B (8/128 experts) | 24 GB | gemma4-iswa |
133
+ | Qwen 3.6 35B-A3B | 10.7 GB (Q2) | 3.0B (8+1/256) | 24 GB | qwen35moe |
134
+ | DiffusionGemma 26B-A4B † | 15.7 GB (Q4) | 4B (diffusion MoE) | 32 GB | diffusion_gemma |
135
+ | North-Mini-Code 30B-A3B † | 17.9 GB (Q4) | 3B (30B MoE) | 36 GB | cohere2_moe |
136
+ | Gemma 4 12B (full) | 23.8 GB (BF16) | 12B (dense) | 48 GB | gemma4-iswa |
137
+ | Gemma 4 26B-A4B | 28 GB (Q8) | 3.8B (8/128 experts) | 64 GB | gemma4-iswa |
138
+ | Qwen 3.6 35B-A3B | 38.5 GB (Q8) | 3.0B (8+1/256) | 96 GB | qwen35moe |
139
+
140
+ *Min RAM* is the threshold for auto-recommendation (weights ≤ ~55% of unified memory, leaving room for KV cache + OS); you can still pick a heavier model manually. **†** experimental — pickable but **not** auto-recommended (DiffusionGemma needs a separate runner; `cohere2_moe` is unvalidated on this stack).
141
+
125
142
  ## How LocalCode works
126
143
 
127
144
  LocalCode runs a custom [llama.cpp](https://github.com/ggerganov/llama.cpp) fork with **TurboQuant KV cache compression** — a technique from Google's ICLR 2026 paper that we patched into llama.cpp for Apple Silicon. This compresses the KV cache 3.8× — fitting 32K context in 355 MiB on a 16 GB MacBook.
128
145
 
129
- The default model (**Gemma 4 26B-A4B**) is a Mixture-of-Experts architecture — 25.2 B total parameters but only 3.8 B active per token. That's what makes ~27 tok/s possible on a laptop.
146
+ LocalCode picks a model based on **your Mac's RAM** — there's no fixed default. It scales from Gemma 4 12B on 16 GB up to Qwen 3.6 35B-A3B on 64 GB+. The recommended models are Mixture-of-Experts — only ~3.8 B parameters active per token, which is what makes ~27 tok/s possible on a laptop.
130
147
 
131
148
  Under the hood:
132
149
 
133
150
  - **TurboQuant KV cache** — asymmetric q8\_0-K + turbo4-V quantization, 3.8× compression vs. f16
134
151
  - **Multi-region mmap patch** — fixes a Metal OOM crash where llama.cpp's loader spanned the entire GGUF file into one Metal buffer
135
152
  - **GPU memory unlock** — auto-prompts to raise `iogpu.wired_limit_mb` for full Metal offload
136
- - **Agent loop** — phased CREATE/EDIT/CHAT/RUN/SEARCH routing with task state, evidence-driven completion, and recovery modes for small-model failure patterns
153
+ - **Agent loop** — goal-typed routing (build / edit / run / chat) with task state, evidence-driven completion, and recovery modes for small-model failure patterns
137
154
 
138
155
  ## Sponsors
139
156
 
@@ -9,7 +9,7 @@
9
9
  <p align="center">
10
10
  <img src="https://img.shields.io/pypi/v/localcode?style=flat-square&color=7c4dff" alt="PyPI">
11
11
  <img src="https://img.shields.io/badge/license-Apache_2.0-4caf50?style=flat-square" alt="License">
12
- <img src="https://img.shields.io/badge/python-3.11+-3776ab?style=flat-square" alt="Python">
12
+ <img src="https://img.shields.io/badge/python-3.9+-3776ab?style=flat-square" alt="Python">
13
13
  <img src="https://img.shields.io/badge/platform-Apple%20Silicon-999999?style=flat-square" alt="Platform">
14
14
  </p>
15
15
 
@@ -63,7 +63,7 @@ We are building for a world of truly democratized AI — where everyone has acce
63
63
 
64
64
  - **Mac with Apple Silicon**
65
65
  - **16 GB RAM** minimum
66
- - **Python 3.11+**
66
+ - **Python 3.9+**
67
67
  - **~12 GB free disk** (10 GB model + server)
68
68
 
69
69
  ### Tested hardware
@@ -77,18 +77,35 @@ LocalCode is early software. Hardware support is expected to broaden, but only t
77
77
  | M4 Apple Silicon | 24 GB+ | Not yet tested | Expected to support larger contexts, but needs validation |
78
78
  | Intel Mac | Any | Not supported | LocalCode targets Apple Silicon |
79
79
 
80
+ ## Models
81
+
82
+ On launch, LocalCode recommends the best model for **your Mac's RAM** — there's no fixed default. You can pick any of these (or a different quant) in the model picker.
83
+
84
+ | Model | Size (quant) | Active params | Min RAM | Architecture |
85
+ | --- | ---: | --- | ---: | --- |
86
+ | Gemma 4 12B | 7.4 GB (Q4) | 12B (dense) | 16 GB | gemma4-iswa |
87
+ | Gemma 4 26B-A4B | 11.2 GB (Q3) | 3.8B (8/128 experts) | 24 GB | gemma4-iswa |
88
+ | Qwen 3.6 35B-A3B | 10.7 GB (Q2) | 3.0B (8+1/256) | 24 GB | qwen35moe |
89
+ | DiffusionGemma 26B-A4B † | 15.7 GB (Q4) | 4B (diffusion MoE) | 32 GB | diffusion_gemma |
90
+ | North-Mini-Code 30B-A3B † | 17.9 GB (Q4) | 3B (30B MoE) | 36 GB | cohere2_moe |
91
+ | Gemma 4 12B (full) | 23.8 GB (BF16) | 12B (dense) | 48 GB | gemma4-iswa |
92
+ | Gemma 4 26B-A4B | 28 GB (Q8) | 3.8B (8/128 experts) | 64 GB | gemma4-iswa |
93
+ | Qwen 3.6 35B-A3B | 38.5 GB (Q8) | 3.0B (8+1/256) | 96 GB | qwen35moe |
94
+
95
+ *Min RAM* is the threshold for auto-recommendation (weights ≤ ~55% of unified memory, leaving room for KV cache + OS); you can still pick a heavier model manually. **†** experimental — pickable but **not** auto-recommended (DiffusionGemma needs a separate runner; `cohere2_moe` is unvalidated on this stack).
96
+
80
97
  ## How LocalCode works
81
98
 
82
99
  LocalCode runs a custom [llama.cpp](https://github.com/ggerganov/llama.cpp) fork with **TurboQuant KV cache compression** — a technique from Google's ICLR 2026 paper that we patched into llama.cpp for Apple Silicon. This compresses the KV cache 3.8× — fitting 32K context in 355 MiB on a 16 GB MacBook.
83
100
 
84
- The default model (**Gemma 4 26B-A4B**) is a Mixture-of-Experts architecture — 25.2 B total parameters but only 3.8 B active per token. That's what makes ~27 tok/s possible on a laptop.
101
+ LocalCode picks a model based on **your Mac's RAM** — there's no fixed default. It scales from Gemma 4 12B on 16 GB up to Qwen 3.6 35B-A3B on 64 GB+. The recommended models are Mixture-of-Experts — only ~3.8 B parameters active per token, which is what makes ~27 tok/s possible on a laptop.
85
102
 
86
103
  Under the hood:
87
104
 
88
105
  - **TurboQuant KV cache** — asymmetric q8\_0-K + turbo4-V quantization, 3.8× compression vs. f16
89
106
  - **Multi-region mmap patch** — fixes a Metal OOM crash where llama.cpp's loader spanned the entire GGUF file into one Metal buffer
90
107
  - **GPU memory unlock** — auto-prompts to raise `iogpu.wired_limit_mb` for full Metal offload
91
- - **Agent loop** — phased CREATE/EDIT/CHAT/RUN/SEARCH routing with task state, evidence-driven completion, and recovery modes for small-model failure patterns
108
+ - **Agent loop** — goal-typed routing (build / edit / run / chat) with task state, evidence-driven completion, and recovery modes for small-model failure patterns
92
109
 
93
110
  ## Sponsors
94
111
 
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "localcode"
7
- version = "0.2.15"
7
+ version = "0.2.16"
8
8
  description = "High-performance AI coding on consumer hardware."
9
9
  readme = "README.md"
10
10
  requires-python = ">=3.9"
@@ -1,3 +1,3 @@
1
1
  __all__ = ["__version__"]
2
2
 
3
- __version__ = "0.2.15"
3
+ __version__ = "0.2.16"
@@ -16,7 +16,7 @@ re-exported here so external callers can continue to import from
16
16
  Background: before T0.1, agent.py was a 1792-line monolith. The split
17
17
  broke it into focused modules (each ≤ ~720 LoC), with __init__.py
18
18
  reduced to this re-export surface — well under the 400-LoC cap the
19
- plan sets for god modules (see eval/OPTIMIZATION_PLAN.md § T0).
19
+ plan sets for god modules (see dev/eval/OPTIMIZATION_PLAN.md § T0).
20
20
 
21
21
  Unused-import warnings in this file are expected — every imported
22
22
  name is intentionally re-exported. The `# noqa: F401` comments
@@ -140,7 +140,7 @@ from .helpers import ( # noqa: F401
140
140
 
141
141
  # ── Prompt templates + project-instructions loader ────────────────────────
142
142
  # Moved to agent/prompts.py during the T0.1-b split. Re-exported here so
143
- # external callers (eval/prompt_variants.py, tests/promptfoo, app.py,
143
+ # external callers (dev/eval/prompt_variants.py, tests/promptfoo, app.py,
144
144
  # tests/test_context_pipeline_e2e.py) that do
145
145
  # `from localcode.agent import SYSTEM_PROMPT`
146
146
  # keep working unchanged. See agent/prompts.py for the commented
@@ -160,7 +160,6 @@ from .prompts import ( # noqa: F401 — re-exports for back-compat
160
160
  # and the dispatcher (for _execute_tool). Plan-mode gating still lives
161
161
  # here because it's cross-tool policy, not tool-specific logic.
162
162
 
163
- from ..tools import ALL_SCHEMAS as TOOL_SCHEMAS # for agent-loop tool registry injection
164
163
 
165
164
 
166
165
  # ── Result Management ────────────────────────────────────────────────────
@@ -53,16 +53,6 @@ __all__: list[str] = []
53
53
  _SHRINK_GUARD_SOURCE_EXTS = {".py", ".js", ".jsx", ".ts", ".tsx", ".css", ".html"}
54
54
 
55
55
 
56
- def _canonical_creation_root(app: "LocalCodeApp") -> Path | None:
57
- task = getattr(getattr(app, "session", None), "current_task", None)
58
- if getattr(task, "task_kind", "") != "new_app":
59
- return None
60
- slug = str(getattr(task, "task_slug", "") or "").strip()
61
- if not slug:
62
- return None
63
- return (app.repo_root / slug).resolve()
64
-
65
-
66
56
  def _path_within(path: Path, root: Path) -> bool:
67
57
  try:
68
58
  path.resolve().relative_to(root)
@@ -14,14 +14,14 @@ Problems with the monolith:
14
14
  session, which means every new session re-evaluates the whole
15
15
  prompt. Our benchmark shows prompt_ms of ~48 ms warm; the
16
16
  theoretical floor with a stable prefix cache is ~5-10 ms.
17
- • No way to A/B sections individually. `eval/prompt_variants.py`
17
+ • No way to A/B sections individually. `dev/eval/prompt_variants.py`
18
18
  only supports coarse "strip rule N" mutations. You can't
19
19
  answer "what if we drop the build-app rules for debugging
20
20
  tasks?" because there's no boundary between them.
21
21
  • No way to gate sections on trigger phrases. Every session ships
22
22
  rule 10 (open browser) whether or not a web app is in scope.
23
23
 
24
- This module is **Phase 1** of T0.11 (see eval/OPTIMIZATION_PLAN.md):
24
+ This module is **Phase 1** of T0.11 (see dev/eval/OPTIMIZATION_PLAN.md):
25
25
  introduce the section-registry concept with behaviour-neutral
26
26
  defaults. The composer produces the same output as the old
27
27
  `SYSTEM_PROMPT.format(...)` for the default all-sections-on case.
@@ -55,11 +55,9 @@ work is an add-only operation.
55
55
  from __future__ import annotations
56
56
 
57
57
  from dataclasses import dataclass
58
- from pathlib import Path
59
58
  from typing import Callable
60
59
 
61
60
  from .prompts import SYSTEM_PROMPT
62
- from .prompts import _load_project_instructions
63
61
 
64
62
 
65
63
  __all__ = [
@@ -241,10 +239,3 @@ def compose_system_prompt(
241
239
  parts.insert(-1, CACHE_BOUNDARY_MARKER)
242
240
 
243
241
  return "".join(parts)
244
-
245
-
246
- def load_project_instructions(repo_root: Path) -> str:
247
- """Convenience re-export so callers outside agent/ that don't
248
- want to depend on `agent.prompts` internals can build a
249
- SectionContext purely from this module."""
250
- return _load_project_instructions(repo_root)
@@ -4,7 +4,6 @@ from concurrent.futures import ThreadPoolExecutor, as_completed
4
4
  from dataclasses import replace
5
5
  import logging
6
6
  from pathlib import Path
7
- import re
8
7
 
9
8
  from rich.console import Console
10
9
  from rich.panel import Panel
@@ -41,7 +40,7 @@ from .autonomy import AutonomyLevel, apply_autonomy_to_permissions, get_policy
41
40
  from .hooks import HookRunner
42
41
  from .snapshots import SnapshotStore, create_snapshot
43
42
  from .turn_diff import TurnDiffTracker, print_turn_diff
44
- from .agent.goal import GoalState, infer_goal_state
43
+ from .agent.goal import infer_goal_state
45
44
  from .performance import detect_machine_profile, benchmark_report, apply_preset, should_promote_legacy_default_to_laptop_26b
46
45
 
47
46
 
@@ -62,67 +61,6 @@ _FOLLOWUP_CHAT_ONLY = {
62
61
  _CODING_TASK_KINDS = {"new_app", "existing_app_edit", "run_or_launch"}
63
62
 
64
63
 
65
- def _looks_like_task_followup(user_text: str, current_task: object | None) -> bool:
66
- """Return true when a short correction should continue the task.
67
-
68
- This is deliberately conservative: it only attaches to a coding task
69
- and only for short correction/addition wording. The actual feature
70
- remains model/tool-driven; LocalCode does not classify domain terms.
71
- """
72
- if current_task is None:
73
- return False
74
- if getattr(current_task, "task_kind", "") not in _CODING_TASK_KINDS:
75
- return False
76
- text = (user_text or "").strip().lower()
77
- if not text:
78
- return False
79
- first = next(iter(re.findall(r"[a-z0-9]+", text)), "")
80
- if text in _FOLLOWUP_CHAT_ONLY:
81
- return False
82
- if len(text) <= 80 and "?" not in text and first not in {"what", "why", "how", "where", "when", "who"}:
83
- return True
84
- return any(
85
- phrase in text
86
- for phrase in (
87
- "i meant",
88
- "you forgot",
89
- "missing",
90
- "add ",
91
- "also add",
92
- "it should",
93
- "should have",
94
- "doesn't have",
95
- "didn't add",
96
- )
97
- )
98
-
99
-
100
- def _continue_goal_for_task_followup(goal_state: GoalState, user_text: str, current_task: object) -> GoalState:
101
- criteria = list(getattr(current_task, "success_criteria", []) or goal_state.success_criteria)
102
- criteria.extend([
103
- "Follow-up correction is implemented in the existing task context",
104
- "Assistant does not stop with a permission question when the requested implementation is local and feasible",
105
- ])
106
- current_kind = getattr(current_task, "task_kind", goal_state.task_kind)
107
- if current_kind in {"new_app", "existing_app_edit"}:
108
- goal_type = "edit_existing"
109
- task_kind = "existing_app_edit"
110
- else:
111
- goal_type = getattr(current_task, "goal_type", goal_state.goal_type)
112
- task_kind = current_kind
113
- # Preserve task identity; this turn is a correction on existing work,
114
- # not a fresh task name.
115
- return replace(
116
- goal_state,
117
- goal_type=goal_type,
118
- task_kind=task_kind,
119
- task_slug=getattr(current_task, "task_slug", goal_state.task_slug),
120
- goal_summary=f"{getattr(current_task, 'goal_summary', '')}\nFollow-up: {user_text}".strip()[:240],
121
- success_criteria=tuple(dict.fromkeys(criteria)),
122
- allows_blocking_question=False,
123
- )
124
-
125
-
126
64
  def _canonical_project_dir_has_files(repo_root: Path, slug: str) -> bool:
127
65
  """True when a creation task's canonical project directory already exists.
128
66
 
@@ -101,18 +101,3 @@ def apply_autonomy_to_permissions(permissions, policy: AutonomyPolicy) -> None:
101
101
 
102
102
  if policy.level == AutonomyLevel.FULL_AUTO:
103
103
  permissions.approve_all()
104
-
105
-
106
- def format_autonomy_status(level: AutonomyLevel) -> str:
107
- """Format current autonomy level for display."""
108
- policy = POLICIES[level]
109
- icons = {True: "✓", False: "✗"}
110
- return (
111
- f"Autonomy: {level.value}\n"
112
- f" {policy.description}\n"
113
- f" reads: {icons[policy.auto_approve_reads]}\n"
114
- f" writes: {icons[policy.auto_approve_writes]}\n"
115
- f" bash: {icons[policy.auto_approve_bash]}\n"
116
- f" installs: {icons[policy.auto_approve_installs]}\n"
117
- f" git: {icons[policy.auto_approve_git]}"
118
- )
@@ -539,13 +539,16 @@ def download_model(
539
539
  ) -> tuple[bool, str]:
540
540
  """Download a GGUF model selected from `models_catalog.CHOICES`.
541
541
 
542
- If `choice` is None, defaults to the first entry in CHOICES (Gemma 4 26B).
542
+ If `choice` is None, falls back to `recommend()` — the RAM-appropriate model
543
+ for this machine, not a hardcoded default.
543
544
  Returns (success, path_or_error_message).
544
545
  """
545
- from .models_catalog import CHOICES
546
+ from .models_catalog import recommend
546
547
 
547
548
  if choice is None:
548
- choice = CHOICES[0]
549
+ # No explicit choice — use the RAM-appropriate model for THIS machine,
550
+ # not a hardcoded default.
551
+ choice = recommend()
549
552
 
550
553
  # Already present?
551
554
  existing = get_model_path(choice.filename)
@@ -1247,18 +1250,6 @@ def _ensure_ollama() -> bool:
1247
1250
  return result.returncode == 0
1248
1251
 
1249
1252
 
1250
- def ensure_model_downloaded(model_tag: str, on_progress: Callable[[str], None] | None = None) -> tuple[bool, str]:
1251
- """Ensure the model is downloaded via Ollama. Installs Ollama if needed."""
1252
- if not _ensure_ollama():
1253
- return False, "Could not install Ollama. Install manually: https://ollama.com/download"
1254
- # Start Ollama service if not running
1255
- if platform.system().lower() == "darwin":
1256
- subprocess.Popen(["ollama", "serve"], stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL,
1257
- start_new_session=True)
1258
- import time; time.sleep(2)
1259
- return pull_model(model_tag, on_progress=on_progress)
1260
-
1261
-
1262
1253
  def build_turboquant(on_progress: Callable[[str], None] | None = None) -> tuple[bool, str]:
1263
1254
  """Build the TurboQuant llama.cpp fork from source with Metal support."""
1264
1255
  source = _find_turboquant_source()
@@ -56,15 +56,6 @@ def truncate_with_tail(
56
56
  return "\n".join(head_block + [ellipsis] + tail_block)
57
57
 
58
58
 
59
- def truncate_one_line(text: str, max_chars: int = 80) -> str:
60
- """Truncate to a single line for inline display (e.g. tool-call
61
- args summary). Replaces newlines with spaces, hard-caps length."""
62
- s = (text or "").replace("\n", " ").strip()
63
- if len(s) <= max_chars:
64
- return s
65
- return s[: max_chars - 1] + "…"
66
-
67
-
68
59
  def split_stdout_stderr(text: str) -> tuple[str, str]:
69
60
  """Heuristic split of bash output into (stdout, stderr).
70
61
 
@@ -31,7 +31,7 @@ Scope we DO NOT cover here:
31
31
  override yet).
32
32
  - Prompt rendering differences — the SYSTEM_PROMPT content itself
33
33
  is still one string, and word-level per-family variants would live
34
- in eval/prompt_variants.py, not here.
34
+ in dev/eval/prompt_variants.py, not here.
35
35
  """
36
36
  from __future__ import annotations
37
37
 
@@ -319,25 +319,57 @@ def _system_ram_gb() -> int:
319
319
  return 16
320
320
 
321
321
 
322
+ # Architectures we never AUTO-recommend (users can still pick them explicitly in
323
+ # the model picker): diffusion needs a separate one-shot runner — not the
324
+ # standard llama-server — and cohere2_moe is unvalidated on this stack.
325
+ _NO_AUTO_RECOMMEND_ARCHS = {"diffusion_gemma", "cohere2_moe"}
326
+
327
+ # Capability order for auto-recommend, best → worst for coding-agent use. This
328
+ # is deliberately NOT raw file size: the big MoEs measure ~95% HumanEval here
329
+ # (even at low bit) and must outrank the 12B dense, and a higher-bit quant of a
330
+ # family wins. A 12B-BF16 must never be recommended over a 26B/35B MoE just
331
+ # because its file happens to be larger.
332
+ _RECOMMEND_ORDER = [
333
+ "qwen-q8", # 35B-A3B MoE, near-lossless Q8
334
+ "gemma-q8", # 26B-A4B MoE, near-lossless Q8
335
+ "qwen", # 35B-A3B MoE Q2 — 94.7% HumanEval
336
+ "gemma", # 26B-A4B MoE Q3 — 95.1% HumanEval
337
+ "gemma-12b-bf16", # 12B dense, full precision
338
+ "gemma-12b", # 12B dense Q4
339
+ ]
340
+
341
+
342
+ def _capability_rank(choice) -> int:
343
+ """Lower = more capable. Curated models first; any other production model
344
+ sorts after them — so a newly-added quant is still recommendable, but never
345
+ outranks a curated MoE."""
346
+ order = {k: i for i, k in enumerate(_RECOMMEND_ORDER)}
347
+ return order.get(choice.key, len(_RECOMMEND_ORDER) + 1)
348
+
349
+
322
350
  def recommend(ram_gb: int | None = None) -> ModelChoice:
323
- """Pick the catalog entry best suited to the host's RAM.
351
+ """Pick the best model for THIS machine's RAM — capability-ranked, never an
352
+ experimental architecture, and never a hardcoded default.
324
353
 
325
- Rule of thumb: model weights + KV + OS headroom should fit in ~70% of
326
- unified memory. We bias conservatively — being slightly under-quantized
327
- is worse than crashing on load. Falls back to the first entry if nothing
328
- matches (shouldn't happen with the current catalog).
354
+ Weights must fit in ~55% of unified memory (leaves room for KV cache,
355
+ activations, OS). Among the production-ready models that fit, return the
356
+ most capable (see ``_RECOMMEND_ORDER``) so the recommendation scales with
357
+ the user's hardware instead of defaulting to any one model.
329
358
  """
330
359
  if ram_gb is None:
331
360
  ram_gb = _system_ram_gb()
332
- # Sort candidates by size_gb; pick the biggest whose weights fit
333
- # in ~55% of RAM (leaves room for KV cache, activations, OS).
334
361
  budget = ram_gb * 0.55
335
- fits = [c for c in CHOICES if c.size_gb <= budget]
336
- if fits:
337
- return max(fits, key=lambda c: c.size_gb)
338
- # Nothing fits the budget — return the smallest entry so at least
339
- # something is suggested rather than a recommendation the user can't run.
340
- return min(CHOICES, key=lambda c: c.size_gb)
362
+ candidates = [
363
+ c for c in CHOICES
364
+ if c.architecture not in _NO_AUTO_RECOMMEND_ARCHS and c.size_gb <= budget
365
+ ]
366
+ if candidates:
367
+ # Most capable that fits; tie-break toward the larger (better-quant) file.
368
+ return min(candidates, key=lambda c: (_capability_rank(c), -c.size_gb))
369
+ # Nothing fits the budget — smallest production-ready model so the user still
370
+ # gets something runnable rather than an impossible recommendation.
371
+ prod = [c for c in CHOICES if c.architecture not in _NO_AUTO_RECOMMEND_ARCHS]
372
+ return min(prod or CHOICES, key=lambda c: c.size_gb)
341
373
 
342
374
 
343
375
  def by_key(key: str) -> ModelChoice | None:
@@ -404,39 +436,6 @@ def current(config) -> ModelChoice | None:
404
436
  return by_filename(name)
405
437
 
406
438
 
407
- def format_choice_long(c: ModelChoice, *, downloaded: bool, current_marker: bool = False) -> str:
408
- """Multi-line formatted description for the picker UI."""
409
- marker = " (current)" if current_marker else ""
410
- status = "downloaded" if downloaded else f"will download {c.size_gb:.1f} GB"
411
- if c.humaneval_pass_at_1 is not None:
412
- bench = f"{c.humaneval_pass_at_1*100:.1f}% HumanEval pass@1 (measured on this stack)"
413
- else:
414
- bench = "no benchmark (untested on this stack)"
415
- # Warn if this model is too big for the current Mac's RAM budget.
416
- # Short inline warning; the picker screen also dims models with a
417
- # bad fit so users can see at a glance.
418
- try:
419
- from .health import estimate_fit
420
- fits, reason = estimate_fit(c.size_gb)
421
- except Exception:
422
- fits, reason = True, ""
423
- fit_line = "" if fits else f" ⚠ fit: {reason}\n"
424
- return (
425
- f"[{c.key}] {c.name}{marker}\n"
426
- f" source: {c.hf_repo}\n"
427
- f" url: {c.hf_url}\n"
428
- f" filename: {c.filename}\n"
429
- f" size: {c.size_gb:.1f} GB ({status})\n"
430
- f"{fit_line}"
431
- f" active: {c.active_params}\n"
432
- f" arch: {c.architecture}\n"
433
- f" license: {c.license}\n"
434
- f" benchmark: {bench}\n"
435
- f" download path: {c.local_path}\n"
436
- f" note: {c.notes}"
437
- )
438
-
439
-
440
439
  # ---------------------------------------------------------------------------
441
440
  # Curated MODEL-GROUP layer (ADDITIVE — built on top of the catalog above).
442
441
  #
@@ -1,9 +1,6 @@
1
1
  from __future__ import annotations
2
2
 
3
3
  import re
4
- import subprocess
5
- import tempfile
6
- from pathlib import Path
7
4
  from dataclasses import dataclass
8
5
 
9
6
 
@@ -24,13 +21,6 @@ class DiffFile:
24
21
  hunks: list[DiffHunk]
25
22
 
26
23
 
27
- def extract_last_diff_block(text: str) -> str | None:
28
- matches = DIFF_BLOCK_RE.findall(text)
29
- if not matches:
30
- return None
31
- return matches[-1].strip()
32
-
33
-
34
24
  def parse_diff(diff_text: str) -> list[DiffFile]:
35
25
  files: list[DiffFile] = []
36
26
  current: DiffFile | None = None
@@ -73,18 +63,3 @@ def build_diff(selected_files: list[DiffFile]) -> str:
73
63
  blocks.append(hunk.header)
74
64
  blocks.extend(hunk.lines)
75
65
  return "\n".join(blocks) + ("\n" if blocks else "")
76
-
77
-
78
- def apply_diff(repo_root: Path, diff_text: str) -> tuple[bool, str]:
79
- with tempfile.NamedTemporaryFile("w", suffix=".diff", delete=False) as handle:
80
- handle.write(diff_text)
81
- patch_path = Path(handle.name)
82
- result = subprocess.run(
83
- ["git", "apply", "--reject", "--whitespace=nowarn", str(patch_path)],
84
- cwd=repo_root,
85
- capture_output=True,
86
- text=True,
87
- check=False,
88
- )
89
- output = (result.stdout + "\n" + result.stderr).strip()
90
- return result.returncode == 0, output or "Patch applied."
@@ -104,14 +104,6 @@ def read_plan(slug: str) -> str | None:
104
104
  return None
105
105
 
106
106
 
107
- def write_plan(slug: str, content: str) -> Path:
108
- """Persist the plan. Returns the path on disk so callers can surface it."""
109
- ensure_plans_dir()
110
- p = plan_path(slug)
111
- p.write_text(content, encoding="utf-8")
112
- return p
113
-
114
-
115
107
  def new_slug() -> str:
116
108
  """Generate a fresh slug, retrying up to 10 times if a file already
117
109
  exists (very unlikely but keeps us honest)."""
@@ -151,26 +151,6 @@ def process_summary(repo_root: Path | str) -> str:
151
151
  return "\n".join(lines)
152
152
 
153
153
 
154
- def stop_all_records(repo_root: Path | str) -> str:
155
- records = load_records(repo_root)
156
- if not records:
157
- return "No LocalCode-managed processes recorded."
158
- stopped = 0
159
- skipped = 0
160
- for record in list(records):
161
- if record.stopped_at:
162
- skipped += 1
163
- continue
164
- if record.pid <= 0 or not _pid_alive(record.pid):
165
- skipped += 1
166
- continue
167
- if stop_record(repo_root, record):
168
- stopped += 1
169
- else:
170
- skipped += 1
171
- return f"Stopped {stopped} LocalCode-managed process group(s). Skipped {skipped}."
172
-
173
-
174
154
  def _pid_alive(pid: int) -> bool:
175
155
  try:
176
156
  os.kill(pid, 0)
@@ -1,6 +1,6 @@
1
1
  """Per-machine model launch recommendations — the output of the model-opt loop.
2
2
 
3
- The offline optimizer (eval/model_opt.py) sweeps quants/params, scores each
3
+ The offline optimizer (dev/eval/model_opt.py) sweeps quants/params, scores each
4
4
  combo on the eval suite, and writes the winner here. At launch,
5
5
  ``runtime.llama_server_command`` consults ``load_overrides`` so the tuned
6
6
  params are applied automatically.
@@ -217,7 +217,7 @@ class StreamEvent(dict):
217
217
  def apply_param_overrides(cmd: list[str], env: dict | None = None) -> list[str]:
218
218
  """Rewrite llama-server flags from ``LOCALCODE_OVERRIDE_*`` env vars.
219
219
 
220
- Lets the offline model-optimizer (eval/model_opt.py) sweep launch
220
+ Lets the offline model-optimizer (dev/eval/model_opt.py) sweep launch
221
221
  parameters — GPU layers, context size, threads, batch — WITHOUT editing
222
222
  config or the catalog. Only flags already present in ``cmd`` are
223
223
  rewritten; an unset env var leaves the command untouched, so the default
@@ -193,21 +193,3 @@ def create_snapshot(session_id: str, repo_root: str, messages: list[dict],
193
193
  store = SnapshotStore()
194
194
  store.save(snapshot)
195
195
  return snapshot
196
-
197
-
198
- def restore_snapshot(snapshot: GhostSnapshot) -> dict:
199
- """Restore file system state from a snapshot.
200
-
201
- Returns dict of files restored.
202
- """
203
- restored = {}
204
- root = Path(snapshot.repo_root)
205
- for rel_path, content in snapshot.file_snapshots.items():
206
- full = root / rel_path
207
- try:
208
- full.parent.mkdir(parents=True, exist_ok=True)
209
- full.write_text(content)
210
- restored[rel_path] = "restored"
211
- except Exception as e:
212
- restored[rel_path] = f"error: {e}"
213
- return restored