llama-cpp-pydist 0.17.0__py3-none-any.whl → 0.19.0__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (368)
  1. llama_cpp/binaries/{llama-b7278-bin-win-cpu-x64.zip → llama-b7488-bin-win-cpu-x64.zip} +0 -0
  2. llama_cpp_pydist-0.19.0.dist-info/METADATA +2506 -0
  3. {llama_cpp_pydist-0.17.0.dist-info → llama_cpp_pydist-0.19.0.dist-info}/RECORD +365 -302
  4. scripts/generate_changelog.py +10 -0
  5. vendor_llama_cpp_pydist/llama.cpp/.devops/cann.Dockerfile +3 -3
  6. vendor_llama_cpp_pydist/llama.cpp/.devops/cpu.Dockerfile +1 -1
  7. vendor_llama_cpp_pydist/llama.cpp/.devops/cuda.Dockerfile +1 -1
  8. vendor_llama_cpp_pydist/llama.cpp/.devops/intel.Dockerfile +1 -1
  9. vendor_llama_cpp_pydist/llama.cpp/.devops/llama-cli-cann.Dockerfile +3 -2
  10. vendor_llama_cpp_pydist/llama.cpp/.devops/llama-cpp-cuda.srpm.spec +2 -0
  11. vendor_llama_cpp_pydist/llama.cpp/.devops/llama-cpp.srpm.spec +2 -0
  12. vendor_llama_cpp_pydist/llama.cpp/.devops/musa.Dockerfile +1 -1
  13. vendor_llama_cpp_pydist/llama.cpp/.devops/rocm.Dockerfile +1 -1
  14. vendor_llama_cpp_pydist/llama.cpp/.devops/s390x.Dockerfile +1 -1
  15. vendor_llama_cpp_pydist/llama.cpp/.devops/tools.sh +6 -2
  16. vendor_llama_cpp_pydist/llama.cpp/.devops/vulkan.Dockerfile +1 -1
  17. vendor_llama_cpp_pydist/llama.cpp/.github/ISSUE_TEMPLATE/011-bug-results.yml +6 -3
  18. vendor_llama_cpp_pydist/llama.cpp/.github/ISSUE_TEMPLATE/019-bug-misc.yml +1 -0
  19. vendor_llama_cpp_pydist/llama.cpp/.github/actions/windows-setup-cuda/action.yml +31 -0
  20. vendor_llama_cpp_pydist/llama.cpp/.github/workflows/build-linux-cross.yml +1 -0
  21. vendor_llama_cpp_pydist/llama.cpp/.github/workflows/build.yml +77 -17
  22. vendor_llama_cpp_pydist/llama.cpp/.github/workflows/release.yml +89 -44
  23. vendor_llama_cpp_pydist/llama.cpp/.github/workflows/server-webui.yml +225 -0
  24. vendor_llama_cpp_pydist/llama.cpp/.github/workflows/server.yml +0 -264
  25. vendor_llama_cpp_pydist/llama.cpp/.gitignore +1 -0
  26. vendor_llama_cpp_pydist/llama.cpp/CODEOWNERS +3 -2
  27. vendor_llama_cpp_pydist/llama.cpp/CONTRIBUTING.md +2 -1
  28. vendor_llama_cpp_pydist/llama.cpp/README.md +6 -16
  29. vendor_llama_cpp_pydist/llama.cpp/SECURITY.md +3 -0
  30. vendor_llama_cpp_pydist/llama.cpp/ci/run.sh +18 -12
  31. vendor_llama_cpp_pydist/llama.cpp/common/CMakeLists.txt +2 -0
  32. vendor_llama_cpp_pydist/llama.cpp/common/arg.cpp +530 -240
  33. vendor_llama_cpp_pydist/llama.cpp/common/arg.h +52 -2
  34. vendor_llama_cpp_pydist/llama.cpp/common/chat-parser-xml-toolcall.cpp +36 -18
  35. vendor_llama_cpp_pydist/llama.cpp/common/chat-parser-xml-toolcall.h +1 -1
  36. vendor_llama_cpp_pydist/llama.cpp/common/chat-parser.cpp +3 -2
  37. vendor_llama_cpp_pydist/llama.cpp/common/chat-peg-parser.cpp +12 -2
  38. vendor_llama_cpp_pydist/llama.cpp/common/chat.cpp +272 -0
  39. vendor_llama_cpp_pydist/llama.cpp/common/common.cpp +156 -67
  40. vendor_llama_cpp_pydist/llama.cpp/common/common.h +51 -17
  41. vendor_llama_cpp_pydist/llama.cpp/common/console.cpp +680 -47
  42. vendor_llama_cpp_pydist/llama.cpp/common/console.h +30 -8
  43. vendor_llama_cpp_pydist/llama.cpp/common/download.cpp +69 -25
  44. vendor_llama_cpp_pydist/llama.cpp/common/json-schema-to-grammar.cpp +132 -3
  45. vendor_llama_cpp_pydist/llama.cpp/common/json-schema-to-grammar.h +20 -0
  46. vendor_llama_cpp_pydist/llama.cpp/common/log.cpp +8 -26
  47. vendor_llama_cpp_pydist/llama.cpp/common/log.h +1 -0
  48. vendor_llama_cpp_pydist/llama.cpp/common/peg-parser.cpp +1 -1
  49. vendor_llama_cpp_pydist/llama.cpp/common/preset.cpp +398 -0
  50. vendor_llama_cpp_pydist/llama.cpp/common/preset.h +74 -0
  51. vendor_llama_cpp_pydist/llama.cpp/common/sampling.cpp +67 -54
  52. vendor_llama_cpp_pydist/llama.cpp/common/sampling.h +8 -0
  53. vendor_llama_cpp_pydist/llama.cpp/convert_hf_to_gguf.py +677 -405
  54. vendor_llama_cpp_pydist/llama.cpp/convert_hf_to_gguf_update.py +1 -0
  55. vendor_llama_cpp_pydist/llama.cpp/docs/android/imported-into-android-studio.jpg +0 -0
  56. vendor_llama_cpp_pydist/llama.cpp/docs/android.md +22 -2
  57. vendor_llama_cpp_pydist/llama.cpp/docs/backend/SYCL.md +2 -0
  58. vendor_llama_cpp_pydist/llama.cpp/docs/backend/ZenDNN.md +258 -0
  59. vendor_llama_cpp_pydist/llama.cpp/docs/backend/hexagon/CMakeUserPresets.json +2 -0
  60. vendor_llama_cpp_pydist/llama.cpp/docs/backend/zDNN.md +5 -0
  61. vendor_llama_cpp_pydist/llama.cpp/docs/build-riscv64-spacemit.md +1 -0
  62. vendor_llama_cpp_pydist/llama.cpp/docs/build.md +32 -0
  63. vendor_llama_cpp_pydist/llama.cpp/docs/development/HOWTO-add-model.md +3 -2
  64. vendor_llama_cpp_pydist/llama.cpp/docs/docker.md +18 -14
  65. vendor_llama_cpp_pydist/llama.cpp/docs/ops/CPU.csv +474 -20
  66. vendor_llama_cpp_pydist/llama.cpp/docs/ops/CUDA.csv +488 -34
  67. vendor_llama_cpp_pydist/llama.cpp/docs/ops/OpenCL.csv +15130 -4510
  68. vendor_llama_cpp_pydist/llama.cpp/docs/ops/SYCL.csv +797 -361
  69. vendor_llama_cpp_pydist/llama.cpp/docs/ops/WebGPU.csv +18741 -0
  70. vendor_llama_cpp_pydist/llama.cpp/docs/ops/ZenDNN.csv +18741 -0
  71. vendor_llama_cpp_pydist/llama.cpp/docs/ops.md +109 -108
  72. vendor_llama_cpp_pydist/llama.cpp/ggml/CMakeLists.txt +10 -0
  73. vendor_llama_cpp_pydist/llama.cpp/ggml/include/ggml-alloc.h +9 -0
  74. vendor_llama_cpp_pydist/llama.cpp/ggml/include/ggml-backend.h +1 -0
  75. vendor_llama_cpp_pydist/llama.cpp/ggml/include/ggml-cpu.h +1 -0
  76. vendor_llama_cpp_pydist/llama.cpp/ggml/include/ggml-rpc.h +1 -2
  77. vendor_llama_cpp_pydist/llama.cpp/ggml/include/ggml-zendnn.h +22 -0
  78. vendor_llama_cpp_pydist/llama.cpp/ggml/include/ggml.h +29 -8
  79. vendor_llama_cpp_pydist/llama.cpp/ggml/src/CMakeLists.txt +4 -0
  80. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-alloc.c +72 -25
  81. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-backend-reg.cpp +19 -3
  82. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-backend.cpp +21 -2
  83. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cann/aclnn_ops.cpp +153 -61
  84. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cann/common.h +2 -2
  85. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cann/ggml-cann.cpp +9 -8
  86. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/CMakeLists.txt +7 -0
  87. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/arch/arm/repack.cpp +285 -0
  88. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/arch-fallback.h +28 -0
  89. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/ggml-cpu.c +120 -45
  90. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/ggml-cpu.cpp +4 -0
  91. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/ops.cpp +38 -11
  92. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/repack.cpp +288 -1
  93. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/repack.h +8 -0
  94. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/vec.cpp +41 -1
  95. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cpu/vec.h +125 -22
  96. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/argmax.cu +2 -2
  97. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/common.cuh +14 -11
  98. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/diag.cu +77 -0
  99. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/diag.cuh +5 -0
  100. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/fattn-common.cuh +3 -3
  101. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/fattn-mma-f16.cuh +20 -23
  102. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/fattn-tile.cuh +11 -0
  103. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/fattn.cu +15 -1
  104. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/fill.cu +37 -0
  105. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/fill.cuh +3 -0
  106. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/ggml-cuda.cu +13 -2
  107. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/mma.cuh +194 -83
  108. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/mmf.cu +3 -1
  109. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/mmf.cuh +14 -10
  110. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/mmq.cuh +36 -29
  111. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/mmvf.cu +4 -1
  112. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/pad.cu +64 -33
  113. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/solve_tri.cu +118 -46
  114. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/ssm-conv.cu +14 -20
  115. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/vendors/hip.h +4 -0
  116. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-cuda/vendors/musa.h +5 -0
  117. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/CMakeLists.txt +3 -1
  118. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/ggml-hexagon.cpp +19 -7
  119. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/htp/CMakeLists.txt +2 -1
  120. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/htp/act-ops.c +90 -2
  121. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/htp/htp-msg.h +6 -5
  122. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/htp/hvx-utils.c +154 -47
  123. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/htp/hvx-utils.h +57 -0
  124. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/htp/main.c +2 -0
  125. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/htp/matmul-ops.c +176 -28
  126. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-hexagon/htp/rope-ops.c +37 -41
  127. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-metal/ggml-metal-context.m +26 -16
  128. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-metal/ggml-metal-device.cpp +38 -1
  129. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-metal/ggml-metal-device.h +16 -0
  130. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-metal/ggml-metal-device.m +175 -28
  131. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-metal/ggml-metal-impl.h +1 -0
  132. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-metal/ggml-metal-ops.cpp +36 -8
  133. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-metal/ggml-metal.metal +127 -9
  134. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-opencl/ggml-opencl.cpp +4 -0
  135. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-rpc/ggml-rpc.cpp +40 -9
  136. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/add-id.cpp +77 -0
  137. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/add-id.hpp +8 -0
  138. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/common.hpp +17 -0
  139. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/convert.cpp +34 -0
  140. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/dequantize.hpp +18 -0
  141. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/dpct/helper.hpp +56 -3
  142. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/element_wise.cpp +97 -0
  143. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/element_wise.hpp +4 -0
  144. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/ggml-sycl.cpp +21 -6
  145. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/mmvq.cpp +22 -0
  146. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/pad.cpp +5 -5
  147. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/softmax.cpp +1 -1
  148. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/ssm_conv.cpp +1 -1
  149. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-sycl/vecdotq.hpp +58 -0
  150. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/ggml-vulkan.cpp +421 -363
  151. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/conv2d_mm.comp +8 -13
  152. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/diag.comp +29 -0
  153. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/flash_attn.comp +3 -0
  154. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/flash_attn_cm1.comp +3 -0
  155. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/get_rows.comp +2 -2
  156. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq1_m.comp +70 -20
  157. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq1_s.comp +40 -24
  158. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/mul_mm_funcs.glsl +8 -5
  159. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/pad.comp +20 -5
  160. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/rms_norm.comp +5 -1
  161. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/soft_max_large1.comp +62 -0
  162. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/soft_max_large2.comp +79 -0
  163. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/soft_max_large3.comp +65 -0
  164. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/soft_max_large_common.glsl +53 -0
  165. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/solve_tri.comp +36 -27
  166. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/topk_moe.comp +18 -11
  167. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/topk_nary_search.comp +58 -16
  168. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp +14 -3
  169. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-webgpu/ggml-webgpu.cpp +606 -364
  170. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-webgpu/wgsl-shaders/embed_wgsl.py +16 -1
  171. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-webgpu/wgsl-shaders/unary_op.wgsl +461 -0
  172. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-zendnn/CMakeLists.txt +92 -0
  173. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml-zendnn/ggml-zendnn.cpp +466 -0
  174. vendor_llama_cpp_pydist/llama.cpp/ggml/src/ggml.c +58 -2
  175. vendor_llama_cpp_pydist/llama.cpp/gguf-py/gguf/constants.py +89 -0
  176. vendor_llama_cpp_pydist/llama.cpp/gguf-py/gguf/tensor_mapping.py +107 -3
  177. vendor_llama_cpp_pydist/llama.cpp/gguf-py/gguf/utility.py +1 -1
  178. vendor_llama_cpp_pydist/llama.cpp/grammars/README.md +27 -3
  179. vendor_llama_cpp_pydist/llama.cpp/include/llama.h +18 -1
  180. vendor_llama_cpp_pydist/llama.cpp/pyrightconfig.json +1 -1
  181. vendor_llama_cpp_pydist/llama.cpp/scripts/compare-logprobs.py +281 -0
  182. vendor_llama_cpp_pydist/llama.cpp/scripts/snapdragon/adb/run-cli.sh +1 -1
  183. vendor_llama_cpp_pydist/llama.cpp/scripts/snapdragon/adb/run-mtmd.sh +65 -0
  184. vendor_llama_cpp_pydist/llama.cpp/scripts/sync-ggml.last +1 -1
  185. vendor_llama_cpp_pydist/llama.cpp/src/CMakeLists.txt +2 -1
  186. vendor_llama_cpp_pydist/llama.cpp/src/llama-arch.cpp +1890 -2248
  187. vendor_llama_cpp_pydist/llama.cpp/src/llama-arch.h +9 -2
  188. vendor_llama_cpp_pydist/llama.cpp/src/llama-batch.cpp +12 -2
  189. vendor_llama_cpp_pydist/llama.cpp/src/llama-batch.h +4 -2
  190. vendor_llama_cpp_pydist/llama.cpp/src/llama-context.cpp +99 -29
  191. vendor_llama_cpp_pydist/llama.cpp/src/llama-context.h +9 -3
  192. vendor_llama_cpp_pydist/llama.cpp/src/llama-grammar.cpp +233 -33
  193. vendor_llama_cpp_pydist/llama.cpp/src/llama-grammar.h +20 -1
  194. vendor_llama_cpp_pydist/llama.cpp/src/llama-graph.cpp +85 -17
  195. vendor_llama_cpp_pydist/llama.cpp/src/llama-graph.h +17 -4
  196. vendor_llama_cpp_pydist/llama.cpp/src/llama-hparams.cpp +6 -0
  197. vendor_llama_cpp_pydist/llama.cpp/src/llama-hparams.h +5 -1
  198. vendor_llama_cpp_pydist/llama.cpp/src/llama-impl.cpp +4 -0
  199. vendor_llama_cpp_pydist/llama.cpp/src/llama-kv-cache.cpp +90 -42
  200. vendor_llama_cpp_pydist/llama.cpp/src/llama-kv-cache.h +19 -2
  201. vendor_llama_cpp_pydist/llama.cpp/src/llama-memory-hybrid.cpp +1 -1
  202. vendor_llama_cpp_pydist/llama.cpp/src/llama-mmap.cpp +123 -28
  203. vendor_llama_cpp_pydist/llama.cpp/src/llama-mmap.h +5 -1
  204. vendor_llama_cpp_pydist/llama.cpp/src/llama-model-loader.cpp +58 -13
  205. vendor_llama_cpp_pydist/llama.cpp/src/llama-model-loader.h +2 -0
  206. vendor_llama_cpp_pydist/llama.cpp/src/llama-model.cpp +134 -57
  207. vendor_llama_cpp_pydist/llama.cpp/src/llama-model.h +1 -0
  208. vendor_llama_cpp_pydist/llama.cpp/src/llama-quant.cpp +1 -28
  209. vendor_llama_cpp_pydist/llama.cpp/src/llama-sampling.cpp +16 -0
  210. vendor_llama_cpp_pydist/llama.cpp/src/llama-vocab.cpp +2 -1
  211. vendor_llama_cpp_pydist/llama.cpp/src/llama.cpp +665 -1
  212. vendor_llama_cpp_pydist/llama.cpp/src/models/deepseek2.cpp +27 -5
  213. vendor_llama_cpp_pydist/llama.cpp/src/models/{gemma3-iswa.cpp → gemma3.cpp} +30 -5
  214. vendor_llama_cpp_pydist/llama.cpp/src/models/glm4-moe.cpp +28 -11
  215. vendor_llama_cpp_pydist/llama.cpp/src/models/glm4.cpp +27 -4
  216. vendor_llama_cpp_pydist/llama.cpp/src/models/models.h +8 -7
  217. vendor_llama_cpp_pydist/llama.cpp/src/models/nemotron-h.cpp +35 -6
  218. vendor_llama_cpp_pydist/llama.cpp/src/models/qwen2.cpp +12 -3
  219. vendor_llama_cpp_pydist/llama.cpp/src/models/qwen3next.cpp +81 -266
  220. vendor_llama_cpp_pydist/llama.cpp/tests/CMakeLists.txt +8 -0
  221. vendor_llama_cpp_pydist/llama.cpp/tests/test-arg-parser.cpp +43 -6
  222. vendor_llama_cpp_pydist/llama.cpp/tests/test-backend-ops.cpp +183 -37
  223. vendor_llama_cpp_pydist/llama.cpp/tests/test-barrier.cpp +156 -14
  224. vendor_llama_cpp_pydist/llama.cpp/tests/test-chat.cpp +459 -15
  225. vendor_llama_cpp_pydist/llama.cpp/tests/test-grammar-integration.cpp +108 -3
  226. vendor_llama_cpp_pydist/llama.cpp/tests/test-grammar-parser.cpp +14 -0
  227. vendor_llama_cpp_pydist/llama.cpp/tests/test-json-schema-to-grammar.cpp +75 -0
  228. vendor_llama_cpp_pydist/llama.cpp/tests/test-llama-grammar.cpp +1 -1
  229. vendor_llama_cpp_pydist/llama.cpp/tests/test-lora-conversion-inference.sh +6 -6
  230. vendor_llama_cpp_pydist/llama.cpp/tests/test-state-restore-fragmented.cpp +122 -0
  231. vendor_llama_cpp_pydist/llama.cpp/tools/CMakeLists.txt +3 -1
  232. vendor_llama_cpp_pydist/llama.cpp/tools/cli/CMakeLists.txt +10 -0
  233. vendor_llama_cpp_pydist/llama.cpp/tools/cli/README.md +1 -0
  234. vendor_llama_cpp_pydist/llama.cpp/tools/cli/cli.cpp +395 -0
  235. vendor_llama_cpp_pydist/llama.cpp/tools/{main → completion}/CMakeLists.txt +2 -2
  236. vendor_llama_cpp_pydist/llama.cpp/tools/{main → completion}/README.md +16 -16
  237. vendor_llama_cpp_pydist/llama.cpp/tools/{main/main.cpp → completion/completion.cpp} +15 -26
  238. vendor_llama_cpp_pydist/llama.cpp/tools/cvector-generator/cvector-generator.cpp +3 -3
  239. vendor_llama_cpp_pydist/llama.cpp/tools/fit-params/CMakeLists.txt +8 -0
  240. vendor_llama_cpp_pydist/llama.cpp/tools/fit-params/README.md +55 -0
  241. vendor_llama_cpp_pydist/llama.cpp/tools/fit-params/fit-params.cpp +66 -0
  242. vendor_llama_cpp_pydist/llama.cpp/tools/gguf-split/tests.sh +1 -1
  243. vendor_llama_cpp_pydist/llama.cpp/tools/imatrix/imatrix.cpp +3 -3
  244. vendor_llama_cpp_pydist/llama.cpp/tools/llama-bench/README.md +1 -1
  245. vendor_llama_cpp_pydist/llama.cpp/tools/llama-bench/llama-bench.cpp +2 -1
  246. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/CMakeLists.txt +28 -2
  247. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/clip-graph.h +121 -0
  248. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/clip-impl.h +37 -1
  249. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/clip-model.h +331 -0
  250. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/clip.cpp +729 -2216
  251. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/clip.h +3 -1
  252. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/cogvlm.cpp +98 -0
  253. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/conformer.cpp +217 -0
  254. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/glm4v.cpp +120 -0
  255. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/internvl.cpp +69 -0
  256. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/kimivl.cpp +63 -0
  257. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/llama4.cpp +96 -0
  258. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/llava.cpp +374 -0
  259. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/minicpmv.cpp +114 -0
  260. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/models.h +68 -0
  261. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/pixtral.cpp +86 -0
  262. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/qwen2vl.cpp +183 -0
  263. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/qwen3vl.cpp +191 -0
  264. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/siglip.cpp +81 -0
  265. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/models/whisper-enc.cpp +106 -0
  266. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/mtmd-audio.cpp +371 -550
  267. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/mtmd-audio.h +20 -27
  268. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/mtmd-cli.cpp +30 -7
  269. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/mtmd-helper.cpp +4 -0
  270. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/mtmd.cpp +29 -13
  271. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/mtmd.h +5 -0
  272. vendor_llama_cpp_pydist/llama.cpp/tools/mtmd/tests.sh +33 -19
  273. vendor_llama_cpp_pydist/llama.cpp/tools/perplexity/perplexity.cpp +3 -3
  274. vendor_llama_cpp_pydist/llama.cpp/tools/quantize/tests.sh +1 -1
  275. vendor_llama_cpp_pydist/llama.cpp/tools/server/CMakeLists.txt +29 -3
  276. vendor_llama_cpp_pydist/llama.cpp/tools/server/README-dev.md +177 -0
  277. vendor_llama_cpp_pydist/llama.cpp/tools/server/README.md +138 -171
  278. vendor_llama_cpp_pydist/llama.cpp/tools/server/public/index.html.gz +0 -0
  279. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-common.cpp +15 -12
  280. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-common.h +4 -0
  281. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-context.cpp +306 -127
  282. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-context.h +12 -2
  283. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-models.cpp +178 -210
  284. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-models.h +34 -15
  285. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-queue.cpp +11 -2
  286. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-queue.h +6 -3
  287. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-task.cpp +14 -7
  288. vendor_llama_cpp_pydist/llama.cpp/tools/server/server-task.h +62 -25
  289. vendor_llama_cpp_pydist/llama.cpp/tools/server/server.cpp +19 -9
  290. vendor_llama_cpp_pydist/llama.cpp/tools/server/tests/unit/test_chat_completion.py +19 -0
  291. vendor_llama_cpp_pydist/llama.cpp/tools/server/tests/unit/test_compat_anthropic.py +1 -1
  292. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/README.md +6 -5
  293. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/docs/architecture/high-level-architecture-simplified.md +6 -2
  294. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/docs/architecture/high-level-architecture.md +13 -3
  295. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/package-lock.json +32 -24
  296. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/package.json +4 -5
  297. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/app.d.ts +7 -0
  298. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatAttachments/ChatAttachmentPreview.svelte +1 -1
  299. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatAttachments/ChatAttachmentThumbnailFile.svelte +1 -1
  300. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatForm/ChatForm.svelte +29 -3
  301. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatForm/ChatFormActions/ChatFormActionFileAttachments.svelte +1 -1
  302. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatForm/ChatFormActions/ChatFormActions.svelte +1 -0
  303. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatMessages/ChatMessage.svelte +77 -11
  304. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatMessages/ChatMessageAssistant.svelte +4 -2
  305. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatMessages/ChatMessageEditForm.svelte +391 -0
  306. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatMessages/ChatMessageStatistics.svelte +108 -6
  307. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatMessages/ChatMessageSystem.svelte +216 -0
  308. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatMessages/ChatMessageUser.svelte +27 -49
  309. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatMessages/ChatMessages.svelte +17 -5
  310. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatScreen/ChatScreen.svelte +21 -4
  311. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatScreen/ChatScreenHeader.svelte +6 -1
  312. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatSettings/ChatSettings.svelte +22 -7
  313. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatSettings/ChatSettingsFields.svelte +17 -2
  314. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatSettings/ChatSettingsImportExportTab.svelte +68 -2
  315. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatSidebar/ChatSidebar.svelte +11 -1
  316. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatSidebar/ChatSidebarConversationItem.svelte +51 -2
  317. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/chat/ChatSidebar/ChatSidebarSearch.svelte +2 -16
  318. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/index.ts +3 -0
  319. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/misc/BadgeChatStatistic.svelte +26 -7
  320. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/misc/MarkdownContent.svelte +269 -169
  321. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/misc/SearchInput.svelte +73 -0
  322. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/misc/SyntaxHighlightedCode.svelte +3 -2
  323. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/models/ModelsSelector.svelte +272 -313
  324. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/app/server/ServerErrorSplash.svelte +2 -1
  325. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/ui/popover/index.ts +19 -0
  326. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/ui/popover/popover-close.svelte +7 -0
  327. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/ui/popover/popover-content.svelte +37 -0
  328. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/ui/popover/popover-portal.svelte +7 -0
  329. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/ui/popover/popover-trigger.svelte +17 -0
  330. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/ui/popover/popover.svelte +7 -0
  331. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/ui/switch/index.ts +7 -0
  332. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/components/ui/switch/switch.svelte +29 -0
  333. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/constants/floating-ui-constraints.ts +0 -1
  334. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/constants/settings-config.ts +12 -1
  335. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/enums/chat.ts +4 -0
  336. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/enums/index.ts +2 -0
  337. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/markdown/enhance-code-blocks.ts +162 -0
  338. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/markdown/enhance-links.ts +33 -0
  339. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/services/chat.ts +2 -44
  340. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/services/database.ts +43 -0
  341. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/services/parameter-sync.spec.ts +14 -0
  342. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/services/parameter-sync.ts +75 -13
  343. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/stores/chat.svelte.ts +283 -178
  344. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/stores/conversations.svelte.ts +24 -2
  345. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/stores/models.svelte.ts +25 -1
  346. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/stores/server.svelte.ts +4 -0
  347. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/stores/settings.svelte.ts +2 -1
  348. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/types/api.d.ts +2 -0
  349. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/types/chat.d.ts +1 -1
  350. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/utils/api-key-validation.ts +2 -1
  351. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/utils/clipboard.ts +262 -0
  352. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/utils/file-preview.ts +0 -9
  353. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/utils/index.ts +11 -2
  354. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/utils/latex-protection.ts +13 -10
  355. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/utils/text.ts +7 -0
  356. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/routes/+layout.svelte +25 -9
  357. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/tests/unit/clipboard.test.ts +423 -0
  358. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/{src/lib/utils → tests/unit}/latex-protection.test.ts +22 -1
  359. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/{src/lib/utils → tests/unit}/model-names.test.ts +1 -1
  360. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/vite.config.ts +2 -2
  361. vendor_llama_cpp_pydist/llama.cpp/tools/tts/tts.cpp +6 -6
  362. vendor_llama_cpp_pydist/llama.cpp/vendor/cpp-httplib/CMakeLists.txt +5 -0
  363. llama_cpp_pydist-0.17.0.dist-info/METADATA +0 -1347
  364. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/src/lib/utils/copy.ts +0 -71
  365. vendor_llama_cpp_pydist/llama.cpp/tools/server/webui/tests/server/demo.spec.ts +0 -7
  366. {llama_cpp_pydist-0.17.0.dist-info → llama_cpp_pydist-0.19.0.dist-info}/WHEEL +0 -0
  367. {llama_cpp_pydist-0.17.0.dist-info → llama_cpp_pydist-0.19.0.dist-info}/licenses/LICENSE +0 -0
  368. {llama_cpp_pydist-0.17.0.dist-info → llama_cpp_pydist-0.19.0.dist-info}/top_level.txt +0 -0