llama-cpp-python 0.2.28__tar.gz → 0.2.29__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (612):
  1. llama_cpp_python-0.2.29/.git/FETCH_HEAD +1 -0
  2. llama_cpp_python-0.2.29/.git/HEAD +1 -0
  3. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/config +1 -1
  4. llama_cpp_python-0.2.29/.git/index +0 -0
  5. llama_cpp_python-0.2.29/.git/logs/HEAD +1 -0
  6. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/HEAD +1 -0
  7. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/config +1 -1
  8. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/index +0 -0
  9. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/logs/HEAD +2 -0
  10. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/logs/refs/heads/master +1 -0
  11. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/logs/refs/remotes/origin/HEAD +1 -0
  12. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/objects/pack/pack-089f43df9dfbcbef5693213d630b739a6bd96e17.idx +0 -0
  13. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/pack/pack-51c0c02c987a3a975ed4edb03bbd1999de104e16.pack → llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/objects/pack/pack-089f43df9dfbcbef5693213d630b739a6bd96e17.pack +0 -0
  14. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/objects/pack/pack-089f43df9dfbcbef5693213d630b739a6bd96e17.rev +0 -0
  15. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/packed-refs +2 -0
  16. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/refs/heads/master +1 -0
  17. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/refs/tags/b1878 +1 -0
  18. llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/shallow +1 -0
  19. llama_cpp_python-0.2.29/.git/objects/02/c09afb0bf5559d3fe64ce67f4ff82af32ff50f +0 -0
  20. llama_cpp_python-0.2.29/.git/objects/03/6b2ddd1f34297fc03f715b82fd66945e9147ea +0 -0
  21. llama_cpp_python-0.2.29/.git/objects/1a/5152530cfbde487c928b60269a29fa5219f617 +0 -0
  22. llama_cpp_python-0.2.29/.git/objects/1b/78703a3fcd25c369a170cc7c94ca5a0a0e3baf +0 -0
  23. llama_cpp_python-0.2.29/.git/objects/4b/11fa83c00a3c04cfb47775ffcd226167d52044 +0 -0
  24. llama_cpp_python-0.2.29/.git/objects/50/6ab1f7ef5b87b110a38090b844b19b63c5bb8c +0 -0
  25. llama_cpp_python-0.2.29/.git/objects/65/206bf28d4bcaebea79c68bbd4e526aed5da6b3 +0 -0
  26. llama_cpp_python-0.2.29/.git/objects/6e/7ace3b7938f7c58a9ef2bf593c13691c03cf45 +0 -0
  27. llama_cpp_python-0.2.29/.git/objects/90/2a43919c5d79d1d418aee2d1512c2e92e8a00b +0 -0
  28. llama_cpp_python-0.2.29/.git/objects/9e/8e3cec752c06b0fd8cebdebbc6dcf7cade1a5a +0 -0
  29. llama_cpp_python-0.2.29/.git/objects/a4/5e5d77363eb85144d4aff1a3cbe86ce94d5c92 +0 -0
  30. llama_cpp_python-0.2.29/.git/objects/ba/14c5172dd87bbfcee083a5eac8c0511bb0c633 +0 -0
  31. llama_cpp_python-0.2.29/.git/objects/c0/2e656426ce672792fd20cb55c9616067974520 +0 -0
  32. llama_cpp_python-0.2.29/.git/objects/c0/748ee14e43d553bccbf402a4ed6c13b563b453 +0 -0
  33. llama_cpp_python-0.2.29/.git/objects/d1/ae9b564d3ab02c6b91162e52d822d36524edb3 +0 -0
  34. llama_cpp_python-0.2.29/.git/objects/e4/be9d1c98b789ed81b2d0fbdd28a441f267f489 +0 -0
  35. llama_cpp_python-0.2.29/.git/objects/ef/9392b7a3d1f6802cef539eea18185eb50c61af +2 -0
  36. llama_cpp_python-0.2.29/.git/objects/f7/b6ba6b1950c0c0a796d996f980e763bd9641cb +0 -0
  37. llama_cpp_python-0.2.29/.git/objects/f9/be3237d374ae1fa7e6d7e9587f17636b0a4f35 +0 -0
  38. llama_cpp_python-0.2.29/.git/refs/tags/v0.2.29 +1 -0
  39. llama_cpp_python-0.2.29/.git/shallow +1 -0
  40. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/CHANGELOG.md +9 -0
  41. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/PKG-INFO +1 -1
  42. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/common.py +1 -1
  43. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/low_level_api_chat_cpp.py +36 -14
  44. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/__init__.py +1 -1
  45. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/_utils.py +9 -11
  46. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama.py +38 -1
  47. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama_cpp.py +67 -13
  48. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama_grammar.py +0 -1
  49. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/model.py +19 -1
  50. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/settings.py +8 -0
  51. llama_cpp_python-0.2.29/tests/test_grammar.py +52 -0
  52. llama_cpp_python-0.2.29/vendor/llama.cpp/.github/workflows/nix-ci-aarch64.yml +55 -0
  53. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/nix-ci.yml +0 -41
  54. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/nix-flake-update.yml +1 -1
  55. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.gitignore +1 -0
  56. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/CMakeLists.txt +6 -2
  57. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/Makefile +4 -10
  58. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/Package.swift +1 -1
  59. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/awq-py/README.md +1 -1
  60. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/build-info.cpp +1 -1
  61. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/common.cpp +57 -29
  62. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/common.h +3 -1
  63. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/sampling.cpp +5 -4
  64. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-hf-to-gguf.py +35 -13
  65. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/CMakeLists.txt +1 -3
  66. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched-bench/batched-bench.cpp +3 -0
  67. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/benchmark/benchmark-matmult.cpp +2 -2
  68. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/export-lora/export-lora.cpp +1 -2
  69. llama_cpp_python-0.2.29/vendor/llama.cpp/examples/imatrix/CMakeLists.txt +5 -0
  70. llama_cpp_python-0.2.29/vendor/llama.cpp/examples/imatrix/imatrix.cpp +380 -0
  71. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama-bench/llama-bench.cpp +78 -68
  72. llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Models/LlamaState.swift +189 -0
  73. llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/ContentView.swift +145 -0
  74. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/DownloadButton.swift +2 -0
  75. llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/InputButton.swift +131 -0
  76. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.pbxproj +6 -2
  77. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/clip.cpp +24 -38
  78. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main/main.cpp +11 -2
  79. llama_cpp_python-0.2.29/vendor/llama.cpp/examples/pydantic-models-to-grammar-examples.py +136 -0
  80. llama_cpp_python-0.2.29/vendor/llama.cpp/examples/pydantic_models_to_grammar.py +1151 -0
  81. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize/quantize.cpp +132 -2
  82. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/save-load-state/save-load-state.cpp +10 -11
  83. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/README.md +6 -1
  84. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/server.cpp +241 -122
  85. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-alloc.c +28 -6
  86. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-alloc.h +3 -1
  87. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-backend-impl.h +19 -19
  88. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-backend.c +476 -229
  89. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-backend.h +35 -25
  90. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-cuda.cu +894 -455
  91. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-cuda.h +7 -19
  92. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-impl.h +2 -0
  93. llama_cpp_python-0.2.29/vendor/llama.cpp/ggml-metal.h +64 -0
  94. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-metal.m +612 -776
  95. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-metal.metal +374 -4
  96. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-opencl.cpp +321 -14
  97. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-opencl.h +13 -3
  98. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-quants.c +1681 -27
  99. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-quants.h +21 -2
  100. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml.c +150 -58
  101. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml.h +20 -12
  102. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/constants.py +3 -0
  103. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/tensor_mapping.py +9 -0
  104. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/llama.cpp +1217 -1610
  105. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/llama.h +32 -8
  106. llama_cpp_python-0.2.29/vendor/llama.cpp/scripts/compare-llama-bench.py +374 -0
  107. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/sync-ggml-am.sh +13 -1
  108. llama_cpp_python-0.2.29/vendor/llama.cpp/scripts/sync-ggml.last +1 -0
  109. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-backend-ops.cpp +21 -7
  110. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-quantize-fns.cpp +3 -2
  111. llama_cpp_python-0.2.28/.git/FETCH_HEAD +0 -1
  112. llama_cpp_python-0.2.28/.git/HEAD +0 -1
  113. llama_cpp_python-0.2.28/.git/index +0 -0
  114. llama_cpp_python-0.2.28/.git/logs/HEAD +0 -1
  115. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/FETCH_HEAD +0 -1
  116. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/HEAD +0 -1
  117. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/index +0 -0
  118. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/logs/HEAD +0 -2
  119. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/logs/refs/heads/master +0 -1
  120. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/logs/refs/remotes/origin/HEAD +0 -1
  121. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/3b/a26ebd66b91510725fa32a6180452bf45abf89 +0 -0
  122. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/6e/fb8eb30e7025b168f3fda3ff83b9b386428ad6 +0 -0
  123. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/b2/6b6f72fcaad1b45661afb97e2551ecc2afa075 +0 -0
  124. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/pack/pack-51c0c02c987a3a975ed4edb03bbd1999de104e16.idx +0 -0
  125. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/pack/pack-51c0c02c987a3a975ed4edb03bbd1999de104e16.rev +0 -0
  126. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/packed-refs +0 -2
  127. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/refs/heads/master +0 -1
  128. llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/shallow +0 -2
  129. llama_cpp_python-0.2.28/.git/objects/0c/3b2e0ef0eaaa91538814c8270822dd01c7b9b1 +0 -0
  130. llama_cpp_python-0.2.28/.git/objects/0e/f132b07175867c07ad06fa22ca6b95eca67b59 +0 -0
  131. llama_cpp_python-0.2.28/.git/objects/17/1f357f53b0de535157a2c9b4de04582784ec97 +0 -0
  132. llama_cpp_python-0.2.28/.git/objects/2e/24903c21db75253911a70039ac5622672db813 +0 -0
  133. llama_cpp_python-0.2.28/.git/objects/33/234fb5fc258e8c09a9626dbb299419c57cc399 +0 -0
  134. llama_cpp_python-0.2.28/.git/objects/34/6b4631ebd1f4af85e9988d4a528e00edba6375 +0 -0
  135. llama_cpp_python-0.2.28/.git/objects/44/b6d4a35d3caf0c65aef0a1c77ff0ab4077d405 +0 -0
  136. llama_cpp_python-0.2.28/.git/objects/50/61247a14e480ab1962c8ec8e5417557a12affb +0 -0
  137. llama_cpp_python-0.2.28/.git/objects/55/d08db5f514fb6847938e3d6489b99f737ba6e3 +0 -0
  138. llama_cpp_python-0.2.28/.git/objects/7c/819b0d699f4d334d8020bbd253d3f3f67b4abc +0 -0
  139. llama_cpp_python-0.2.28/.git/objects/8a/80063397bf2687cb3f4534710d607a5906c681 +0 -0
  140. llama_cpp_python-0.2.28/.git/objects/ab/d7b4cde5b5285a44472d8a760b5337c986c47b +0 -0
  141. llama_cpp_python-0.2.28/.git/objects/af/f397f476fb7773d0e89b0e8913c8b1f97ca3e4 +0 -0
  142. llama_cpp_python-0.2.28/.git/objects/b9/373b7ac641e6e9c8d8cc64951139205d91d8bc +0 -0
  143. llama_cpp_python-0.2.28/.git/objects/c8/4fd04498c2fb188ff7c2a59473035fc90eb990 +0 -0
  144. llama_cpp_python-0.2.28/.git/objects/ca/e7ebb7a833dafcd402a96bea3a9574f74f0ed5 +0 -0
  145. llama_cpp_python-0.2.28/.git/objects/eb/51c854fd5ee35f477dbdf46ced6f62448b7750 +0 -0
  146. llama_cpp_python-0.2.28/.git/objects/f0/159663d922a6a693b1f9aee335d8667ae7f39e +0 -0
  147. llama_cpp_python-0.2.28/.git/objects/f5/39ce179f4af1e6b26a8b64c39b6b13fb78d73e +0 -0
  148. llama_cpp_python-0.2.28/.git/refs/tags/v0.2.28 +0 -1
  149. llama_cpp_python-0.2.28/.git/shallow +0 -1
  150. llama_cpp_python-0.2.28/tests/test_grammar.py +0 -13
  151. llama_cpp_python-0.2.28/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Models/LlamaState.swift +0 -100
  152. llama_cpp_python-0.2.28/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/ContentView.swift +0 -138
  153. llama_cpp_python-0.2.28/vendor/llama.cpp/examples/metal/CMakeLists.txt +0 -4
  154. llama_cpp_python-0.2.28/vendor/llama.cpp/examples/metal/metal.cpp +0 -103
  155. llama_cpp_python-0.2.28/vendor/llama.cpp/ggml-metal.h +0 -115
  156. llama_cpp_python-0.2.28/vendor/llama.cpp/scripts/sync-ggml.last +0 -1
  157. llama_cpp_python-0.2.28/vendor/llama.cpp/spm-headers/ggml.h +0 -1
  158. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.dockerignore +0 -0
  159. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/description +0 -0
  160. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/applypatch-msg.sample +0 -0
  161. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/commit-msg.sample +0 -0
  162. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/fsmonitor-watchman.sample +0 -0
  163. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/post-update.sample +0 -0
  164. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-applypatch.sample +0 -0
  165. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-commit.sample +0 -0
  166. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-merge-commit.sample +0 -0
  167. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-push.sample +0 -0
  168. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-rebase.sample +0 -0
  169. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-receive.sample +0 -0
  170. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/prepare-commit-msg.sample +0 -0
  171. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/push-to-checkout.sample +0 -0
  172. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/sendemail-validate.sample +0 -0
  173. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/update.sample +0 -0
  174. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/info/exclude +0 -0
  175. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/description +0 -0
  176. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/applypatch-msg.sample +0 -0
  177. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/commit-msg.sample +0 -0
  178. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/fsmonitor-watchman.sample +0 -0
  179. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/post-update.sample +0 -0
  180. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-applypatch.sample +0 -0
  181. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-commit.sample +0 -0
  182. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-merge-commit.sample +0 -0
  183. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-push.sample +0 -0
  184. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-rebase.sample +0 -0
  185. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-receive.sample +0 -0
  186. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/prepare-commit-msg.sample +0 -0
  187. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/push-to-checkout.sample +0 -0
  188. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/sendemail-validate.sample +0 -0
  189. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/update.sample +0 -0
  190. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/info/exclude +0 -0
  191. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/refs/remotes/origin/HEAD +0 -0
  192. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/04/5856ea2ffe697ec33db1c1c989bd45cde5bb3d +0 -0
  193. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/04/7bc14424303575f73af90611fec827334f54e8 +0 -0
  194. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/0d/870969f4b23bd92a09ec29134d3fb454d38bec +0 -0
  195. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/0e/2a907c0e40de1a432ee0cd2e3d01c634df1a37 +0 -0
  196. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/0e/f7bd4a856ec728adc565133e808628ea5566a1 +0 -0
  197. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/11/2a0f7872fa9244bf38729a2722dc5c08dec20c +0 -0
  198. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/11/b6d5c26e3f7157658952b8ec353e985d522fac +0 -0
  199. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/13/c5b6b0df5f67e80cbe584909b83777901265a1 +0 -0
  200. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/19/9bd4ffbf88c68c98b52c05f388dfa92716f6b7 +0 -0
  201. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/23/e37d4d40e5ec0bfd85b5e928834d58e2cf0da6 +0 -0
  202. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/24/04228325d88c59b819acaedb20b15635f75df9 +0 -0
  203. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/27/2e4767b47397d1529e6a2d01298144d9d746ba +0 -0
  204. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/27/a6b1e5042318f85dc99c9f24f4dd6fc472d242 +0 -0
  205. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/29/03e0146d304bcacbfabfe71f171a2edc03043e +0 -0
  206. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/2c/c6fb02dcb3226c1ecf0fbed6453eb3acadeaa2 +0 -0
  207. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/39/697bfc2538bd4558018d0d721d6d6028c4bb56 +0 -0
  208. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/3a/1d7180d508818fe957923e00dcd8950938632d +0 -0
  209. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/3a/6457dcdfd47e764654bacae0ba8347976b645a +0 -0
  210. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/41/cc68ea2402cf682807649d841e7c0f4175db01 +0 -0
  211. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/47/4503fdfc554d8caabee4f321a80427f8c7d696 +0 -0
  212. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/4b/3189dd1a54be3bc416786ddf184dd047dc4b20 +0 -0
  213. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/51/f357200f8b998031f4be924e11ed2ae4bf3fea +0 -0
  214. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/56/2410fe1a4c4093d62e1705933eaf66c6d99a2c +0 -0
  215. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/5b/51e98ce432974ff031367f8937babe755e3d73 +0 -0
  216. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/5f/350ffe99abe7297b2839f36fd0eaeb98887805 +0 -0
  217. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/60/bc7aef42aac0409cfdca666ad2ff6f516d7b5b +0 -0
  218. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/61/027ef99725c50b0891fdbf0bf263a33abe648f +0 -0
  219. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/68/7316b327ca038d26a338b3070a7d4698322515 +0 -0
  220. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/74/7c6130e3cb1479d20e2013b1dd3db3379c2266 +0 -0
  221. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/76/e26fbd106895fba52861f8ac1e11cc6ee2a307 +0 -0
  222. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/79/5dad726ae91f330c56e49bc188080b5b3b5ba9 +0 -0
  223. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/79/a9e67a1aee09c6d182f240ba5eef32feabcbce +0 -0
  224. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7a/7b899ec7dd48d192cba14ac9c8e9df4233f7fb +0 -0
  225. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7d/5498f9d2c49c1f731b47845d845f6c5e16a3d9 +0 -0
  226. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7d/6c970483161eaf43cfa9d50010c071d4953053 +0 -0
  227. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7e/df0975dc12ccc95ad14de085f07efe6d65c620 +0 -0
  228. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7e/e8f748eab47180cea09c0ad8e75c3b991b4af4 +0 -0
  229. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/80/7b0f57a8a873e58ade0ff0f5b0bcf0ff66b7f9 +0 -0
  230. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/82/e5c4487e57d6d59c901a73bdd2a9bc172fee7c +0 -0
  231. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/8b/d03f88a1895cbf3ef249e13df79ee0efda779d +0 -0
  232. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/8e/32d2c0edce725a47b5845463133919cd766a61 +0 -0
  233. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/91/abb11fdf507883caeeb2d2958e1c65fb6cbdc1 +0 -0
  234. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/99/32d6130f5552a9b85c8b15b4ac6bc26b1068ce +0 -0
  235. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/9d/0ec2f705618e591cfa8d6512cb9a96b3da75f1 +0 -0
  236. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/9d/3d3559849603efda6f3c8181684e4d19e0ec79 +0 -0
  237. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/a9/e51cdc1672134ec9af66c9eccf09f6da4ceccd +0 -0
  238. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/ac/82b8fbb81087ec9b3a72d9e377102a31b28d16 +0 -0
  239. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/b1/f90b91594f496ad9f27b1a68584984f4b523d2 +0 -0
  240. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/b2/e879ec4bfb319459dd5357313ef06158c7039f +0 -0
  241. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/b5/affaa9d6087f3888dd9eedea209bb214b6e135 +0 -0
  242. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/b9/1632f5bc787c1404600c894a6a4126359747d8 +0 -0
  243. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/bb/cbbe7d61558adde3cbfd0c7a63a67c27ed6d30 +0 -0
  244. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/c5/4e4eb5ce2636abd78df46a7616cfe9196a1198 +0 -0
  245. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/c8/5e73d2b657bb05ed99309615d67bac93d9f86e +0 -0
  246. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/ca/ebbb67fdb02a0a8897d4e4826ea046a9931f6f +0 -0
  247. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/cc/6a3a7252ea6e698614f0629d4bc040ab6ca717 +0 -0
  248. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/cd/351ba33849dcf6af35b493f7405962fa1625d4 +0 -0
  249. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/d3/329eec3bac6ce7e54c76b77ac9bf99fab0fe3f +0 -0
  250. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/d3/efb3a6fe1e001db62ec08e5d31ce1d08567045 +0 -0
  251. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/da/c33b74dddf06fcfc01244044eebb102cfcea37 +0 -0
  252. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/e2/13518b95011cb6ee783986624c3b6de8659f81 +0 -0
  253. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/e4/1f375774e6945e445bfb179502b128fe22dda7 +0 -0
  254. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/e6/9de29bb2d1d6434b8b29ae775ad8c2e48c5391 +0 -0
  255. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/e9/30609ff5c479a1d5e12a8f3993582d421a6326 +0 -0
  256. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/eb/0fb9662e690d0f9de4632cddd321b3f872a725 +0 -0
  257. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/eb/9a2cfa9167df02f136502af79738c71363abfd +0 -0
  258. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/ef/1b2c0162e8edd321e2b9c1ce375d96f1f1d048 +0 -0
  259. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/f0/827d762e852a21f6406c469300899d5f509b8f +0 -0
  260. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/f1/b8e9d154231932c4b7b9b59611626764e68632 +0 -0
  261. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/f2/0813765a70679e8a063871c9ef75d75c65ccb6 +0 -0
  262. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fa/dfc5fb4fe6f5eb6d5d98b62519e374a5202b00 +0 -0
  263. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fc/25ff5160028dee3570249abc40cd57780bcca9 +0 -0
  264. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fc/ef8cd800ee8a265b146748d178cb56b5632bf3 +0 -0
  265. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fd/64c09b37947c97e58903ce570785c657d56722 +0 -0
  266. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fe/b0ed68d94eac48b844fd587ddfb808649716a1 +0 -0
  267. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/ff/3e950cd1110fe552912cea4c268c4023d2b737 +0 -0
  268. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  269. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  270. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/dependabot.yml +0 -0
  271. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/build-and-release.yaml +0 -0
  272. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/build-docker.yaml +0 -0
  273. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/publish-to-test.yaml +0 -0
  274. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/publish.yaml +0 -0
  275. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/test-pypi.yaml +0 -0
  276. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/test.yaml +0 -0
  277. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.gitignore +0 -0
  278. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.gitmodules +0 -0
  279. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.readthedocs.yaml +0 -0
  280. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/CMakeLists.txt +0 -0
  281. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/LICENSE.md +0 -0
  282. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/Makefile +0 -0
  283. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/README.md +0 -0
  284. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/README.md +0 -0
  285. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/cuda_simple/Dockerfile +0 -0
  286. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/Dockerfile +0 -0
  287. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/build.sh +0 -0
  288. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/hug_model.py +0 -0
  289. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/start.sh +0 -0
  290. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/start_server.sh +0 -0
  291. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/openblas_simple/Dockerfile +0 -0
  292. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/simple/Dockerfile +0 -0
  293. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/simple/run.sh +0 -0
  294. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/api-reference.md +0 -0
  295. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/changelog.md +0 -0
  296. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/index.md +0 -0
  297. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/install/macos.md +0 -0
  298. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/requirements.txt +0 -0
  299. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/server.md +0 -0
  300. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/fastapi_server.py +0 -0
  301. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/high_level_api_embedding.py +0 -0
  302. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/high_level_api_inference.py +0 -0
  303. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/high_level_api_streaming.py +0 -0
  304. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/langchain_custom_llm.py +0 -0
  305. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/Chat.py +0 -0
  306. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/Miku.py +0 -0
  307. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/ReasonAct.py +0 -0
  308. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/low_level_api_llama_cpp.py +0 -0
  309. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/quantize.py +0 -0
  310. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/readme/low_level_api_llama_cpp.md +0 -0
  311. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/util.py +0 -0
  312. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Batching.ipynb +0 -0
  313. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Clients.ipynb +0 -0
  314. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Functions.ipynb +0 -0
  315. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Guidance.ipynb +0 -0
  316. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Multimodal.ipynb +0 -0
  317. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/PerformanceTuning.ipynb +0 -0
  318. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama_chat_format.py +0 -0
  319. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama_types.py +0 -0
  320. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llava_cpp.py +0 -0
  321. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/py.typed +0 -0
  322. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/__init__.py +0 -0
  323. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/__main__.py +0 -0
  324. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/app.py +0 -0
  325. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/cli.py +0 -0
  326. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/errors.py +0 -0
  327. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/types.py +0 -0
  328. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/mkdocs.yml +0 -0
  329. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/pyproject.toml +0 -0
  330. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/tests/test_llama.py +0 -0
  331. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.clang-tidy +0 -0
  332. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/cloud-v-pipeline +0 -0
  333. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/full-cuda.Dockerfile +0 -0
  334. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/full-rocm.Dockerfile +0 -0
  335. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/full.Dockerfile +0 -0
  336. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/main-cuda.Dockerfile +0 -0
  337. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/main-rocm.Dockerfile +0 -0
  338. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/main.Dockerfile +0 -0
  339. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/apps.nix +0 -0
  340. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/devshells.nix +0 -0
  341. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/jetson-support.nix +0 -0
  342. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/nixpkgs-instances.nix +0 -0
  343. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/package.nix +0 -0
  344. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/scope.nix +0 -0
  345. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/tools.sh +0 -0
  346. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.dockerignore +0 -0
  347. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.ecrc +0 -0
  348. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.editorconfig +0 -0
  349. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.flake8 +0 -0
  350. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.git +0 -0
  351. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/ISSUE_TEMPLATE/bug.md +0 -0
  352. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/ISSUE_TEMPLATE/enhancement.md +0 -0
  353. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/build.yml +0 -0
  354. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/code-coverage.yml +0 -0
  355. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/docker.yml +0 -0
  356. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/editorconfig.yml +0 -0
  357. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/gguf-publish.yml +0 -0
  358. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/nix-publish-flake.yml +0 -0
  359. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/python-check-requirements.yml +0 -0
  360. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/python-lint.yml +0 -0
  361. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/tidy-post.yml +0 -0
  362. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/tidy-review.yml +0 -0
  363. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/zig-build.yml +0 -0
  364. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.pre-commit-config.yaml +0 -0
  365. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/LICENSE +0 -0
  366. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/README.md +0 -0
  367. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/SHA256SUMS +0 -0
  368. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/awq-py/awq/apply_awq.py +0 -0
  369. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/awq-py/requirements.txt +0 -0
  370. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/build.zig +0 -0
  371. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ci/README.md +0 -0
  372. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ci/run.sh +0 -0
  373. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/cmake/FindSIMD.cmake +0 -0
  374. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/codecov.yml +0 -0
  375. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/CMakeLists.txt +0 -0
  376. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/base64.hpp +0 -0
  377. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/build-info.cpp.in +0 -0
  378. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/console.cpp +0 -0
  379. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/console.h +0 -0
  380. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/grammar-parser.cpp +0 -0
  381. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/grammar-parser.h +0 -0
  382. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/log.h +0 -0
  383. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/sampling.h +0 -0
  384. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/stb_image.h +0 -0
  385. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/train.cpp +0 -0
  386. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/train.h +0 -0
  387. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-llama-ggml-to-gguf.py +0 -0
  388. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-lora-to-ggml.py +0 -0
  389. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-persimmon-to-gguf.py +0 -0
  390. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert.py +0 -0
  391. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/BLIS.md +0 -0
  392. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/llama-star/idea-arch.key +0 -0
  393. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/llama-star/idea-arch.pdf +0 -0
  394. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/token_generation_performance_tips.md +0 -0
  395. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/Miku.sh +0 -0
  396. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/alpaca.sh +0 -0
  397. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/baby-llama/CMakeLists.txt +0 -0
  398. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/baby-llama/baby-llama.cpp +0 -0
  399. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/base-translate.sh +0 -0
  400. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched/CMakeLists.txt +0 -0
  401. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched/README.md +0 -0
  402. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched/batched.cpp +0 -0
  403. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched-bench/CMakeLists.txt +0 -0
  404. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched-bench/README.md +0 -0
  405. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/.gitignore +0 -0
  406. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/Makefile +0 -0
  407. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/Package.swift +0 -0
  408. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/README.md +0 -0
  409. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/Sources/main.swift +0 -0
  410. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/beam-search/CMakeLists.txt +0 -0
  411. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/beam-search/beam-search.cpp +0 -0
  412. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/benchmark/CMakeLists.txt +0 -0
  413. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-13B.bat +0 -0
  414. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-13B.sh +0 -0
  415. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-persistent.sh +0 -0
  416. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-vicuna.sh +0 -0
  417. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat.sh +0 -0
  418. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/CMakeLists.txt +0 -0
  419. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/README.md +0 -0
  420. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/convert-llama2c-to-ggml.cpp +0 -0
  421. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/embedding/CMakeLists.txt +0 -0
  422. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/embedding/README.md +0 -0
  423. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/embedding/embedding.cpp +0 -0
  424. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/export-lora/CMakeLists.txt +0 -0
  425. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/export-lora/README.md +0 -0
  426. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/CMakeLists.txt +0 -0
  427. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/README.md +0 -0
  428. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/convert-finetune-checkpoint-to-gguf.py +0 -0
  429. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/finetune.cpp +0 -0
  430. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/finetune.sh +0 -0
  431. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/gguf/CMakeLists.txt +0 -0
  432. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/gguf/gguf.cpp +0 -0
  433. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/gpt4all.sh +0 -0
  434. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/infill/CMakeLists.txt +0 -0
  435. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/infill/README.md +0 -0
  436. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/infill/infill.cpp +0 -0
  437. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/README.md +0 -0
  438. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/graph.py +0 -0
  439. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/jeopardy.sh +0 -0
  440. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/qasheet.csv +0 -0
  441. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/questions.txt +0 -0
  442. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/json-schema-to-grammar.py +0 -0
  443. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama-bench/CMakeLists.txt +0 -0
  444. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama-bench/README.md +0 -0
  445. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/.gitignore +0 -0
  446. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/README.md +0 -0
  447. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.cpp.swift/LibLlama.swift +0 -0
  448. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Assets.xcassets/AppIcon.appiconset/Contents.json +0 -0
  449. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Assets.xcassets/Contents.json +0 -0
  450. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/LoadCustomButton.swift +0 -0
  451. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/llama_swiftuiApp.swift +0 -0
  452. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.xcworkspace/contents.xcworkspacedata +0 -0
  453. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +0 -0
  454. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.vim +0 -0
  455. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama2-13b.sh +0 -0
  456. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama2.sh +0 -0
  457. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/CMakeLists.txt +0 -0
  458. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/README.md +0 -0
  459. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/clip.h +0 -0
  460. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/convert-image-encoder-to-gguf.py +0 -0
  461. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava-cli.cpp +0 -0
  462. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava-surgery.py +0 -0
  463. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava.cpp +0 -0
  464. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava.h +0 -0
  465. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llm.vim +0 -0
  466. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookahead/CMakeLists.txt +0 -0
  467. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookahead/README.md +0 -0
  468. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookahead/lookahead.cpp +0 -0
  469. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookup/CMakeLists.txt +0 -0
  470. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookup/README.md +0 -0
  471. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookup/lookup.cpp +0 -0
  472. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main/CMakeLists.txt +0 -0
  473. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main/README.md +0 -0
  474. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main-cmake-pkg/.gitignore +0 -0
  475. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main-cmake-pkg/CMakeLists.txt +0 -0
  476. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main-cmake-pkg/README.md +0 -0
  477. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/make-ggml.py +0 -0
  478. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/parallel/CMakeLists.txt +0 -0
  479. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/parallel/README.md +0 -0
  480. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/parallel/parallel.cpp +0 -0
  481. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/passkey/CMakeLists.txt +0 -0
  482. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/passkey/README.md +0 -0
  483. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/passkey/passkey.cpp +0 -0
  484. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/perplexity/CMakeLists.txt +0 -0
  485. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/perplexity/README.md +0 -0
  486. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/perplexity/perplexity.cpp +0 -0
  487. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize/CMakeLists.txt +0 -0
  488. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize/README.md +0 -0
  489. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize-stats/CMakeLists.txt +0 -0
  490. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize-stats/quantize-stats.cpp +0 -0
  491. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/reason-act.sh +0 -0
  492. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/save-load-state/CMakeLists.txt +0 -0
  493. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/CMakeLists.txt +0 -0
  494. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/api_like_OAI.py +0 -0
  495. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/chat-llama2.sh +0 -0
  496. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/chat.mjs +0 -0
  497. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/chat.sh +0 -0
  498. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/completion.js.hpp +0 -0
  499. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/deps.sh +0 -0
  500. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/httplib.h +0 -0
  501. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/index.html.hpp +0 -0
  502. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/index.js.hpp +0 -0
  503. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/json-schema-to-grammar.mjs.hpp +0 -0
  504. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/json.hpp +0 -0
  505. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/completion.js +0 -0
  506. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/index.html +0 -0
  507. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/index.js +0 -0
  508. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/json-schema-to-grammar.mjs +0 -0
  509. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server-llama2-13B.sh +0 -0
  510. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/simple/CMakeLists.txt +0 -0
  511. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/simple/README.md +0 -0
  512. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/simple/simple.cpp +0 -0
  513. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/speculative/CMakeLists.txt +0 -0
  514. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/speculative/README.md +0 -0
  515. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/speculative/speculative.cpp +0 -0
  516. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/tokenize/CMakeLists.txt +0 -0
  517. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/tokenize/tokenize.cpp +0 -0
  518. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/CMakeLists.txt +0 -0
  519. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/README.md +0 -0
  520. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/convert-train-checkpoint-to-gguf.py +0 -0
  521. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/train-text-from-scratch.cpp +0 -0
  522. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/flake.lock +0 -0
  523. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/flake.nix +0 -0
  524. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-mpi.c +0 -0
  525. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-mpi.h +0 -0
  526. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/LICENSE +0 -0
  527. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/README.md +0 -0
  528. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/examples/writer.py +0 -0
  529. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/__init__.py +0 -0
  530. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/gguf.py +0 -0
  531. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/gguf_reader.py +0 -0
  532. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/gguf_writer.py +0 -0
  533. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/py.typed +0 -0
  534. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/vocab.py +0 -0
  535. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/pyproject.toml +0 -0
  536. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/__init__.py +0 -0
  537. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/gguf-convert-endian.py +0 -0
  538. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/gguf-dump.py +0 -0
  539. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/gguf-set-metadata.py +0 -0
  540. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/tests/test_gguf.py +0 -0
  541. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/README.md +0 -0
  542. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/arithmetic.gbnf +0 -0
  543. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/c.gbnf +0 -0
  544. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/chess.gbnf +0 -0
  545. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/japanese.gbnf +0 -0
  546. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/json.gbnf +0 -0
  547. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/json_arr.gbnf +0 -0
  548. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/list.gbnf +0 -0
  549. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama-leader.jpeg +0 -0
  550. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama0-banner.png +0 -0
  551. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama0-logo.png +0 -0
  552. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama1-banner.png +0 -0
  553. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama1-logo.png +0 -0
  554. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/mypy.ini +0 -0
  555. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/CMakeLists.txt +0 -0
  556. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/vdot/CMakeLists.txt +0 -0
  557. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/vdot/q8dot.cpp +0 -0
  558. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/vdot/vdot.cpp +0 -0
  559. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/LLM-questions.txt +0 -0
  560. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/alpaca.txt +0 -0
  561. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/assistant.txt +0 -0
  562. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-baichuan.txt +0 -0
  563. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-bob.txt +0 -0
  564. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-qwen.txt +0 -0
  565. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-vicuna-v0.txt +0 -0
  566. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-vicuna-v1.txt +0 -0
  567. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat.txt +0 -0
  568. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/dan-modified.txt +0 -0
  569. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/dan.txt +0 -0
  570. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/mnemonics.txt +0 -0
  571. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/parallel-questions.txt +0 -0
  572. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/reason-act.txt +0 -0
  573. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-hf-to-gguf.txt +0 -0
  574. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-llama-ggml-to-gguf.txt +0 -0
  575. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-lora-to-ggml.txt +0 -0
  576. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-persimmon-to-gguf.txt +0 -0
  577. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert.txt +0 -0
  578. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements.txt +0 -0
  579. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/run_with_preset.py +0 -0
  580. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/LlamaConfig.cmake.in +0 -0
  581. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/build-info.cmake +0 -0
  582. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/build-info.sh +0 -0
  583. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/check-requirements.sh +0 -0
  584. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/convert-gg.sh +0 -0
  585. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/gen-build-info-cpp.cmake +0 -0
  586. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/get-flags.mk +0 -0
  587. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/get-pg.sh +0 -0
  588. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/get-wikitext-2.sh +0 -0
  589. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/qnt-all.sh +0 -0
  590. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/run-all-perf.sh +0 -0
  591. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/run-all-ppl.sh +0 -0
  592. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/server-llm.sh +0 -0
  593. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/sync-ggml.sh +0 -0
  594. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/verify-checksum-models.py +0 -0
  595. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/spm-headers/llama.h +0 -0
  596. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/CMakeLists.txt +0 -0
  597. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-c.c +0 -0
  598. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-double-float.cpp +0 -0
  599. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-grad0.cpp +0 -0
  600. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-grammar-parser.cpp +0 -0
  601. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-llama-grammar.cpp +0 -0
  602. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-opt.cpp +0 -0
  603. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-quantize-perf.cpp +0 -0
  604. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-rope.cpp +0 -0
  605. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-sampling.cpp +0 -0
  606. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-falcon.cpp +0 -0
  607. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-falcon.py +0 -0
  608. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-llama.cpp +0 -0
  609. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-llama.py +0 -0
  610. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-1-bpe.cpp +0 -0
  611. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-1-llama.cpp +0 -0
  612. {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/unicode.h +0 -0
@@ -0,0 +1 @@
1
+ 4b11fa83c00a3c04cfb47775ffcd226167d52044 '4b11fa83c00a3c04cfb47775ffcd226167d52044' of https://github.com/abetlen/llama-cpp-python
@@ -0,0 +1 @@
1
+ 4b11fa83c00a3c04cfb47775ffcd226167d52044
@@ -9,7 +9,7 @@
9
9
  [gc]
10
10
  auto = 0
11
11
  [http "https://github.com/"]
12
- extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzX3o0cnV1YlBtbkRCRjlFeGplTTNOREdVajlMSUVudjE4NXhveA==
12
+ extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzXzg0QXZkVFUxdjRsWmlJSlFjZHVISHVlZnBtUnA3STFDcUxkeA==
13
13
  [submodule "vendor/llama.cpp"]
14
14
  active = true
15
15
  url = https://github.com/ggerganov/llama.cpp.git
Binary file
@@ -0,0 +1 @@
1
+ 0000000000000000000000000000000000000000 4b11fa83c00a3c04cfb47775ffcd226167d52044 runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341384 +0000 checkout: moving from master to refs/tags/v0.2.29
@@ -0,0 +1 @@
1
+ 4483396751c79dea540808b9cb9238245d06da2b
@@ -13,7 +13,7 @@
13
13
  [gc]
14
14
  auto = 0
15
15
  [http "https://github.com/"]
16
- extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzX3o0cnV1YlBtbkRCRjlFeGplTTNOREdVajlMSUVudjE4NXhveA==
16
+ extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzXzg0QXZkVFUxdjRsWmlJSlFjZHVISHVlZnBtUnA3STFDcUxkeA==
17
17
  [url "https://github.com/"]
18
18
  insteadOf = git@github.com:
19
19
  insteadOf = org-6826477@github.com:
@@ -0,0 +1,2 @@
1
+ 0000000000000000000000000000000000000000 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
2
+ 4483396751c79dea540808b9cb9238245d06da2b 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 checkout: moving from master to 4483396751c79dea540808b9cb9238245d06da2b
@@ -0,0 +1 @@
1
+ 0000000000000000000000000000000000000000 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
@@ -0,0 +1 @@
1
+ 0000000000000000000000000000000000000000 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
@@ -0,0 +1,2 @@
1
+ # pack-refs with: peeled fully-peeled sorted
2
+ 4483396751c79dea540808b9cb9238245d06da2b refs/remotes/origin/master
@@ -0,0 +1 @@
1
+ 4483396751c79dea540808b9cb9238245d06da2b
@@ -0,0 +1 @@
1
+ 4483396751c79dea540808b9cb9238245d06da2b
@@ -0,0 +1 @@
1
+ 4483396751c79dea540808b9cb9238245d06da2b
@@ -0,0 +1,2 @@
1
+ x}TM��0�Y�bPj��%�[ ��K�S��R�lM-��J����w4�Xg7�A���潑�u5���w�띏ж�SU��b,<g��� �-�=l6�)��N#o��d&�k�#s)�s��"���1���U�)_������,��g���Ζ�O��ǁS,9�^�4R��]T��l���& D�#�*c5�J��[�ɐ �0�gq�q4�����Z�h�)�(EO��o�@0Ny�~���1MK9����8��W06.q��JK�z �%AZ���„戝��y��wV���!R;�R�mU�g,Xz����#�2jN֥8������Dճ3�Q{�i��<�&��{�,��5 r�(���M�˽w=��A�H�P2��"�d)�A�s�����~�4�#=�<�eM����d��V`���'
2
+ .�����-����3��O9V<��R.�����n~1����L����_�H���y�W9/�{9ݕ�_��i����ҺЧ��P��A�Յ�����/]�X%
@@ -0,0 +1 @@
1
+ 4b11fa83c00a3c04cfb47775ffcd226167d52044
@@ -0,0 +1 @@
1
+ 4b11fa83c00a3c04cfb47775ffcd226167d52044
@@ -7,6 +7,15 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
7
7
 
8
8
  ## [Unreleased]
9
9
 
10
+ ## [0.2.29]
11
+
12
+ - feat: Update llama.cpp to ggerganov/llama.cpp@4483396751c79dea540808b9cb9238245d06da2b
13
+ - feat: Add split_mode option by @abetlen in 84615adbc6855c8384807c42f0130f9a1763f99d
14
+ - feat: Implement GGUF metadata KV overrides by @phiharri in #1011
15
+ - fix: Avoid "LookupError: unknown encoding: ascii" when open() called in a destructor by @yieldthought in #1012
16
+ - fix: Fix low_level_api_chat_cpp example to match current API by @aniljava in #1086
17
+ - fix: Fix Pydantic model parsing by @DeNeutoy in #1087
18
+
10
19
  ## [0.2.28]
11
20
 
12
21
  - feat: Update llama.cpp to ggerganov/llama.cpp@6efb8eb30e7025b168f3fda3ff83b9b386428ad6
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: llama_cpp_python
3
- Version: 0.2.28
3
+ Version: 0.2.29
4
4
  Summary: Python bindings for the llama.cpp library
5
5
  Author-Email: Andrei Betlen <abetlen@gmail.com>
6
6
  License: MIT
@@ -106,7 +106,7 @@ def gpt_params_parse(argv = None):
106
106
  parser.add_argument("--mirostat_lr", type=float, default=0.1, help="Mirostat learning rate, parameter eta",dest="mirostat_eta")
107
107
 
108
108
  parser.add_argument("-m", "--model", type=str, default="./models/llama-7B/ggml-model.bin", help="model path",dest="model")
109
- parser.add_argument("-p", "--prompt", type=str, default="", help="initial prompt",dest="prompt")
109
+ parser.add_argument("-p", "--prompt", type=str, default=None, help="initial prompt",dest="prompt")
110
110
  parser.add_argument("-f", "--file", type=str, default=None, help="file containing initial prompt to load",dest="file")
111
111
  parser.add_argument("--session", type=str, default=None, help="file to cache model state in (may be large!)",dest="path_session")
112
112
  parser.add_argument("--in-prefix", type=str, default="", help="string to prefix user inputs with", dest="input_prefix")
@@ -62,7 +62,7 @@ specified) expect poor results""", file=sys.stderr)
62
62
  self.multibyte_fix = []
63
63
 
64
64
  # model load
65
- self.lparams = llama_cpp.llama_context_default_params()
65
+ self.lparams = llama_cpp.llama_model_default_params()
66
66
  self.lparams.n_ctx = self.params.n_ctx
67
67
  self.lparams.n_parts = self.params.n_parts
68
68
  self.lparams.seed = self.params.seed
@@ -72,7 +72,11 @@ specified) expect poor results""", file=sys.stderr)
72
72
 
73
73
  self.model = llama_cpp.llama_load_model_from_file(
74
74
  self.params.model.encode("utf8"), self.lparams)
75
- self.ctx = llama_cpp.llama_new_context_with_model(self.model, self.lparams)
75
+
76
+ # Context Params.
77
+ self.cparams = llama_cpp.llama_context_default_params()
78
+
79
+ self.ctx = llama_cpp.llama_new_context_with_model(self.model, self.cparams)
76
80
  if (not self.ctx):
77
81
  raise RuntimeError(f"error: failed to load model '{self.params.model}'")
78
82
 
@@ -244,7 +248,7 @@ n_keep = {self.params.n_keep}
244
248
  # tokenize a prompt
245
249
  def _tokenize(self, prompt, bos=True):
246
250
  _arr = (llama_cpp.llama_token * ((len(prompt) + 1) * 4))()
247
- _n = llama_cpp.llama_tokenize(self.ctx, prompt.encode("utf8", errors="ignore"), _arr, len(_arr), bos)
251
+ _n = llama_cpp.llama_tokenize(self.model, prompt.encode("utf8", errors="ignore"), len(prompt), _arr, len(_arr), bos, False)
248
252
  return _arr[:_n]
249
253
 
250
254
  def set_color(self, c):
@@ -304,7 +308,7 @@ n_keep = {self.params.n_keep}
304
308
  self.n_past += n_eval"""
305
309
 
306
310
  if (llama_cpp.llama_eval(
307
- self.ctx, (llama_cpp.llama_token * len(self.embd))(*self.embd), len(self.embd), self.n_past, self.params.n_threads
311
+ self.ctx, (llama_cpp.llama_token * len(self.embd))(*self.embd), len(self.embd), self.n_past
308
312
  ) != 0):
309
313
  raise Exception("Failed to llama_eval!")
310
314
 
@@ -332,7 +336,7 @@ n_keep = {self.params.n_keep}
332
336
  id = 0
333
337
 
334
338
  logits = llama_cpp.llama_get_logits(self.ctx)
335
- n_vocab = llama_cpp.llama_n_vocab(self.ctx)
339
+ n_vocab = llama_cpp.llama_n_vocab(self.model)
336
340
 
337
341
  # Apply params.logit_bias map
338
342
  for key, value in self.params.logit_bias.items():
@@ -349,12 +353,20 @@ n_keep = {self.params.n_keep}
349
353
  last_n_repeat = min(len(self.last_n_tokens), repeat_last_n, self.n_ctx)
350
354
 
351
355
  _arr = (llama_cpp.llama_token * last_n_repeat)(*self.last_n_tokens[len(self.last_n_tokens) - last_n_repeat:])
352
- llama_cpp.llama_sample_repetition_penalty(self.ctx, candidates_p,
353
- _arr,
354
- last_n_repeat, llama_cpp.c_float(self.params.repeat_penalty))
355
- llama_cpp.llama_sample_frequency_and_presence_penalties(self.ctx, candidates_p,
356
- _arr,
357
- last_n_repeat, llama_cpp.c_float(self.params.frequency_penalty), llama_cpp.c_float(self.params.presence_penalty))
356
+ llama_cpp.llama_sample_repetition_penalties(
357
+ ctx=self.ctx,
358
+ candidates=candidates_p,
359
+ last_tokens_data = _arr,
360
+ penalty_last_n = last_n_repeat,
361
+ penalty_repeat = llama_cpp.c_float(self.params.repeat_penalty),
362
+ penalty_freq = llama_cpp.c_float(self.params.frequency_penalty),
363
+ penalty_present = llama_cpp.c_float(self.params.presence_penalty),
364
+ )
365
+
366
+ # NOT PRESENT IN CURRENT VERSION ?
367
+ # llama_cpp.llama_sample_frequency_and_presence_penalti(self.ctx, candidates_p,
368
+ # _arr,
369
+ # last_n_repeat, llama_cpp.c_float(self.params.frequency_penalty), llama_cpp.c_float(self.params.presence_penalty))
358
370
 
359
371
  if not self.params.penalize_nl:
360
372
  logits[llama_cpp.llama_token_nl()] = nl_logit
@@ -473,7 +485,7 @@ n_keep = {self.params.n_keep}
473
485
  def token_to_str(self, token_id: int) -> bytes:
474
486
  size = 32
475
487
  buffer = (ctypes.c_char * size)()
476
- n = llama_cpp.llama_token_to_piece_with_model(
488
+ n = llama_cpp.llama_token_to_piece(
477
489
  self.model, llama_cpp.llama_token(token_id), buffer, size)
478
490
  assert n <= size
479
491
  return bytes(buffer[:n])
@@ -532,6 +544,9 @@ n_keep = {self.params.n_keep}
532
544
  print(i,end="",flush=True)
533
545
  self.params.input_echo = False
534
546
 
547
+ # Using string instead of tokens to check for antiprompt,
548
+ # It is more reliable than tokens for interactive mode.
549
+ generated_str = ""
535
550
  while self.params.interactive:
536
551
  self.set_color(util.CONSOLE_COLOR_USER_INPUT)
537
552
  if (self.params.instruct):
@@ -546,6 +561,10 @@ n_keep = {self.params.n_keep}
546
561
  try:
547
562
  for i in self.output():
548
563
  print(i,end="",flush=True)
564
+ generated_str += i
565
+ for ap in self.params.antiprompt:
566
+ if generated_str.endswith(ap):
567
+ raise KeyboardInterrupt
549
568
  except KeyboardInterrupt:
550
569
  self.set_color(util.CONSOLE_COLOR_DEFAULT)
551
570
  if not self.params.instruct:
@@ -561,7 +580,7 @@ if __name__ == "__main__":
561
580
  time_now = datetime.now()
562
581
  prompt = f"""Text transcript of a never ending dialog, where {USER_NAME} interacts with an AI assistant named {AI_NAME}.
563
582
  {AI_NAME} is helpful, kind, honest, friendly, good at writing and never fails to answer {USER_NAME}’s requests immediately and with details and precision.
564
- There are no annotations like (30 seconds passed...) or (to himself), just what {USER_NAME} and {AI_NAME} say aloud to each other.
583
+ Transcript below contains only the recorded dialog between two, without any annotations like (30 seconds passed...) or (to himself), just what {USER_NAME} and {AI_NAME} say aloud to each other.
565
584
  The dialog lasts for years, the entirety of it is shared below. It's 10000 pages long.
566
585
  The transcript only includes text, it does not include markup like HTML and Markdown.
567
586
 
@@ -575,8 +594,11 @@ The transcript only includes text, it does not include markup like HTML and Mark
575
594
  {AI_NAME}: A cat is a domestic species of small carnivorous mammal. It is the only domesticated species in the family Felidae.
576
595
  {USER_NAME}: Name a color.
577
596
  {AI_NAME}: Blue
578
- {USER_NAME}:"""
597
+ {USER_NAME}: """
598
+
579
599
  params = gpt_params_parse()
600
+ if params.prompt is None and params.file is None:
601
+ params.prompt = prompt
580
602
 
581
603
  with LLaMAInteract(params) as m:
582
604
  m.interact()
@@ -1,4 +1,4 @@
1
1
  from .llama_cpp import *
2
2
  from .llama import *
3
3
 
4
- __version__ = "0.2.28"
4
+ __version__ = "0.2.29"
@@ -1,11 +1,15 @@
1
1
  import os
2
2
  import sys
3
3
 
4
+ import sys, traceback
5
+
6
+ # Avoid "LookupError: unknown encoding: ascii" when open() called in a destructor
7
+ outnull_file = open(os.devnull, "w")
8
+ errnull_file = open(os.devnull, "w")
4
9
 
5
10
  class suppress_stdout_stderr(object):
6
11
  # NOTE: these must be "saved" here to avoid exceptions when using
7
12
  # this context manager inside of a __del__ method
8
- open = open
9
13
  sys = sys
10
14
  os = os
11
15
 
@@ -21,9 +25,6 @@ class suppress_stdout_stderr(object):
21
25
  if not hasattr(self.sys.stdout, 'fileno') or not hasattr(self.sys.stderr, 'fileno'):
22
26
  return self # Return the instance without making changes
23
27
 
24
- self.outnull_file = self.open(self.os.devnull, "w")
25
- self.errnull_file = self.open(self.os.devnull, "w")
26
-
27
28
  self.old_stdout_fileno_undup = self.sys.stdout.fileno()
28
29
  self.old_stderr_fileno_undup = self.sys.stderr.fileno()
29
30
 
@@ -33,11 +34,11 @@ class suppress_stdout_stderr(object):
33
34
  self.old_stdout = self.sys.stdout
34
35
  self.old_stderr = self.sys.stderr
35
36
 
36
- self.os.dup2(self.outnull_file.fileno(), self.old_stdout_fileno_undup)
37
- self.os.dup2(self.errnull_file.fileno(), self.old_stderr_fileno_undup)
37
+ self.os.dup2(outnull_file.fileno(), self.old_stdout_fileno_undup)
38
+ self.os.dup2(errnull_file.fileno(), self.old_stderr_fileno_undup)
38
39
 
39
- self.sys.stdout = self.outnull_file
40
- self.sys.stderr = self.errnull_file
40
+ self.sys.stdout = outnull_file
41
+ self.sys.stderr = errnull_file
41
42
  return self
42
43
 
43
44
  def __exit__(self, *_):
@@ -54,6 +55,3 @@ class suppress_stdout_stderr(object):
54
55
 
55
56
  self.os.close(self.old_stdout_fileno)
56
57
  self.os.close(self.old_stderr_fileno)
57
-
58
- self.outnull_file.close()
59
- self.errnull_file.close()
@@ -730,11 +730,13 @@ class Llama:
730
730
  *,
731
731
  # Model Params
732
732
  n_gpu_layers: int = 0,
733
+ split_mode: int = llama_cpp.LLAMA_SPLIT_LAYER,
733
734
  main_gpu: int = 0,
734
735
  tensor_split: Optional[List[float]] = None,
735
736
  vocab_only: bool = False,
736
737
  use_mmap: bool = True,
737
738
  use_mlock: bool = False,
739
+ kv_overrides: Optional[Dict[str, Union[bool, int, float]]] = None,
738
740
  # Context Params
739
741
  seed: int = llama_cpp.LLAMA_DEFAULT_SEED,
740
742
  n_ctx: int = 512,
@@ -798,11 +800,13 @@ class Llama:
798
800
  Args:
799
801
  model_path: Path to the model.
800
802
  n_gpu_layers: Number of layers to offload to GPU (-ngl). If -1, all layers are offloaded.
801
- main_gpu: The GPU that is used for scratch and small tensors.
803
+ split_mode: How to split the model across GPUs. See llama_cpp.LLAMA_SPLIT_* for options.
804
+ main_gpu: main_gpu interpretation depends on split_mode: LLAMA_SPLIT_NONE: the GPU that is used for the entire model. LLAMA_SPLIT_ROW: the GPU that is used for small tensors and intermediate results. LLAMA_SPLIT_LAYER: ignored
802
805
  tensor_split: How split tensors should be distributed across GPUs. If None, the model is not split.
803
806
  vocab_only: Only load the vocabulary no weights.
804
807
  use_mmap: Use mmap if possible.
805
808
  use_mlock: Force the system to keep the model in RAM.
809
+ kv_overrides: Key-value overrides for the model.
806
810
  seed: RNG seed, -1 for random
807
811
  n_ctx: Text context, 0 = from model
808
812
  n_batch: Prompt processing maximum batch size
@@ -848,6 +852,7 @@ class Llama:
848
852
  self.model_params.n_gpu_layers = (
849
853
  0x7FFFFFFF if n_gpu_layers == -1 else n_gpu_layers
850
854
  ) # 0x7FFFFFFF is INT32 max, will be auto set to all layers
855
+ self.model_params.split_mode = split_mode
851
856
  self.model_params.main_gpu = main_gpu
852
857
  self.tensor_split = tensor_split
853
858
  self._c_tensor_split = None
@@ -866,6 +871,34 @@ class Llama:
866
871
  self.model_params.use_mmap = use_mmap if lora_path is None else False
867
872
  self.model_params.use_mlock = use_mlock
868
873
 
874
+ self.kv_overrides = kv_overrides
875
+ if kv_overrides is not None:
876
+ n_overrides = len(kv_overrides)
877
+ self._kv_overrides_array = llama_cpp.llama_model_kv_override * (n_overrides + 1)
878
+ self._kv_overrides_array_keys = []
879
+
880
+ for k, v in kv_overrides.items():
881
+ key_buf = ctypes.create_string_buffer(k.encode("utf-8"))
882
+ self._kv_overrides_array_keys.append(key_buf)
883
+ self._kv_overrides_array[i].key = key_buf
884
+ if isinstance(v, int):
885
+ self._kv_overrides_array[i].tag = llama_cpp.LLAMA_KV_OVERRIDE_INT
886
+ self._kv_overrides_array[i].value.int_value = v
887
+ elif isinstance(v, float):
888
+ self._kv_overrides_array[i].tag = llama_cpp.LLAMA_KV_OVERRIDE_FLOAT
889
+ self._kv_overrides_array[i].value.float_value = v
890
+ elif isinstance(v, bool):
891
+ self._kv_overrides_array[i].tag = llama_cpp.LLAMA_KV_OVERRIDE_BOOL
892
+ self._kv_overrides_array[i].value.bool_value = v
893
+ else:
894
+ raise ValueError(f"Unknown value type for {k}: {v}")
895
+
896
+ self._kv_overrides_array_sentinel_key = b'\0'
897
+
898
+ # null array sentinel
899
+ self._kv_overrides_array[n_overrides].key = self._kv_overrides_array_sentinel_key
900
+ self.model_params.kv_overrides = self._kv_overrides_array
901
+
869
902
  self.n_batch = min(n_ctx, n_batch) # ???
870
903
  self.n_threads = n_threads or max(multiprocessing.cpu_count() // 2, 1)
871
904
  self.n_threads_batch = n_threads_batch or max(
@@ -2143,11 +2176,13 @@ class Llama:
2143
2176
  model_path=self.model_path,
2144
2177
  # Model Params
2145
2178
  n_gpu_layers=self.model_params.n_gpu_layers,
2179
+ split_mode=self.model_params.split_mode,
2146
2180
  main_gpu=self.model_params.main_gpu,
2147
2181
  tensor_split=self.tensor_split,
2148
2182
  vocab_only=self.model_params.vocab_only,
2149
2183
  use_mmap=self.model_params.use_mmap,
2150
2184
  use_mlock=self.model_params.use_mlock,
2185
+ kv_overrides=self.kv_overrides,
2151
2186
  # Context Params
2152
2187
  seed=self.context_params.seed,
2153
2188
  n_ctx=self.context_params.n_ctx,
@@ -2185,11 +2220,13 @@ class Llama:
2185
2220
  model_path=state["model_path"],
2186
2221
  # Model Params
2187
2222
  n_gpu_layers=state["n_gpu_layers"],
2223
+ split_mode=state["split_mode"],
2188
2224
  main_gpu=state["main_gpu"],
2189
2225
  tensor_split=state["tensor_split"],
2190
2226
  vocab_only=state["vocab_only"],
2191
2227
  use_mmap=state["use_mmap"],
2192
2228
  use_mlock=state["use_mlock"],
2229
+ kv_overrides=state["kv_overrides"],
2193
2230
  # Context Params
2194
2231
  seed=state["seed"],
2195
2232
  n_ctx=state["n_ctx"],
@@ -112,8 +112,8 @@ LLAMA_FILE_MAGIC_GGSN = 0x6767736E
112
112
 
113
113
  # define LLAMA_SESSION_MAGIC LLAMA_FILE_MAGIC_GGSN
114
114
  LLAMA_SESSION_MAGIC = LLAMA_FILE_MAGIC_GGSN
115
- # define LLAMA_SESSION_VERSION 3
116
- LLAMA_SESSION_VERSION = 3
115
+ # define LLAMA_SESSION_VERSION 4
116
+ LLAMA_SESSION_VERSION = 4
117
117
 
118
118
 
119
119
  # struct llama_model;
@@ -180,6 +180,8 @@ LLAMA_TOKEN_TYPE_BYTE = 6
180
180
  # LLAMA_FTYPE_MOSTLY_Q5_K_M = 17, // except 1d tensors
181
181
  # LLAMA_FTYPE_MOSTLY_Q6_K = 18, // except 1d tensors
182
182
  # LLAMA_FTYPE_MOSTLY_IQ2_XXS = 19, // except 1d tensors
183
+ # LLAMA_FTYPE_MOSTLY_IQ2_XS = 20, // except 1d tensors
184
+ # LLAMA_FTYPE_MOSTLY_Q2_K_S = 21, // except 1d tensors
183
185
 
184
186
  # LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
185
187
  # };
@@ -200,6 +202,9 @@ LLAMA_FTYPE_MOSTLY_Q4_K_M = 15
200
202
  LLAMA_FTYPE_MOSTLY_Q5_K_S = 16
201
203
  LLAMA_FTYPE_MOSTLY_Q5_K_M = 17
202
204
  LLAMA_FTYPE_MOSTLY_Q6_K = 18
205
+ LLAMA_FTYPE_MOSTLY_IQ2_XXS = 19
206
+ LLAMA_FTYPE_MOSTLY_IQ2_XS = 20
207
+ LLAMA_FTYPE_MOSTLY_Q2_K_S = 21
203
208
  LLAMA_FTYPE_GUESSED = 1024
204
209
 
205
210
  # enum llama_rope_scaling_type {
@@ -215,6 +220,15 @@ LLAMA_ROPE_SCALING_LINEAR = 1
215
220
  LLAMA_ROPE_SCALING_YARN = 2
216
221
  LLAMA_ROPE_SCALING_MAX_VALUE = LLAMA_ROPE_SCALING_YARN
217
222
 
223
+ # enum llama_split_mode {
224
+ # LLAMA_SPLIT_NONE = 0, // single GPU
225
+ # LLAMA_SPLIT_LAYER = 1, // split layers and KV across GPUs
226
+ # LLAMA_SPLIT_ROW = 2, // split rows across GPUs
227
+ # };
228
+ LLAMA_SPLIT_NONE = 0
229
+ LLAMA_SPLIT_LAYER = 1
230
+ LLAMA_SPLIT_ROW = 2
231
+
218
232
 
219
233
  # typedef struct llama_token_data {
220
234
  # llama_token id; // token id
@@ -360,13 +374,22 @@ class llama_model_kv_override(Structure):
360
374
 
361
375
  # struct llama_model_params {
362
376
  # int32_t n_gpu_layers; // number of layers to store in VRAM
363
- # int32_t main_gpu; // the GPU that is used for scratch and small tensors
364
- # const float * tensor_split; // how to split layers across multiple GPUs (size: LLAMA_MAX_DEVICES)
377
+ # enum llama_split_mode split_mode; // how to split the model across multiple GPUs
378
+
379
+ # // main_gpu interpretation depends on split_mode:
380
+ # // LLAMA_SPLIT_NONE: the GPU that is used for the entire model
381
+ # // LLAMA_SPLIT_ROW: the GPU that is used for small tensors and intermediate results
382
+ # // LLAMA_SPLIT_LAYER: ignored
383
+ # int32_t main_gpu;
384
+
385
+ # // proportion of the model (layers or rows) to offload to each GPU, size: LLAMA_MAX_DEVICES
386
+ # const float * tensor_split;
365
387
 
366
388
  # // Called with a progress value between 0.0 and 1.0. Pass NULL to disable.
367
389
  # // If the provided progress_callback returns true, model loading continues.
368
390
  # // If it returns false, model loading is immediately aborted.
369
391
  # llama_progress_callback progress_callback;
392
+
370
393
  # // context pointer passed to the progress callback
371
394
  # void * progress_callback_user_data;
372
395
 
@@ -384,8 +407,9 @@ class llama_model_params(Structure):
384
407
 
385
408
  Attributes:
386
409
  n_gpu_layers (int): number of layers to store in VRAM
387
- main_gpu (int): the GPU that is used for scratch and small tensors
388
- tensor_split (ctypes.Array[ctypes.c_float]): how to split layers across multiple GPUs (size: LLAMA_MAX_DEVICES)
410
+ split_mode (int): how to split the model across multiple GPUs
411
+ main_gpu (int): the GPU that is used for the entire model. main_gpu interpretation depends on split_mode: LLAMA_SPLIT_NONE: the GPU that is used for the entire model LLAMA_SPLIT_ROW: the GPU that is used for small tensors and intermediate results LLAMA_SPLIT_LAYER: ignored
412
+ tensor_split (ctypes.Array[ctypes.c_float]): proportion of the model (layers or rows) to offload to each GPU, size: LLAMA_MAX_DEVICES
389
413
  progress_callback (llama_progress_callback): called with a progress value between 0.0 and 1.0. Pass NULL to disable. If the provided progress_callback returns true, model loading continues. If it returns false, model loading is immediately aborted.
390
414
  progress_callback_user_data (ctypes.c_void_p): context pointer passed to the progress callback
391
415
  kv_overrides (ctypes.Array[llama_model_kv_override]): override key-value pairs of the model meta data
@@ -395,6 +419,7 @@ class llama_model_params(Structure):
395
419
 
396
420
  _fields_ = [
397
421
  ("n_gpu_layers", c_int32),
422
+ ("split_mode", c_int),
398
423
  ("main_gpu", c_int32),
399
424
  ("tensor_split", c_float_p),
400
425
  ("progress_callback", llama_progress_callback),
@@ -503,6 +528,7 @@ It might not exist for progress report where '.' is output repeatedly."""
503
528
  # bool quantize_output_tensor; // quantize output.weight
504
529
  # bool only_copy; // only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
505
530
  # bool pure; // disable k-quant mixtures and quantize all tensors to the same type
531
+ # void * imatrix; // pointer to importance matrix data
506
532
  # } llama_model_quantize_params;
507
533
  class llama_model_quantize_params(Structure):
508
534
  """Parameters for llama_model_quantize
@@ -514,6 +540,7 @@ class llama_model_quantize_params(Structure):
514
540
  quantize_output_tensor (bool): quantize output.weight
515
541
  only_copy (bool): only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
516
542
  pure (bool): disable k-quant mixtures and quantize all tensors to the same type
543
+ imatrix (ctypes.c_void_p): pointer to importance matrix data
517
544
  """
518
545
 
519
546
  _fields_ = [
@@ -522,6 +549,8 @@ class llama_model_quantize_params(Structure):
522
549
  ("allow_requantize", c_bool),
523
550
  ("quantize_output_tensor", c_bool),
524
551
  ("only_copy", c_bool),
552
+ ("pure", c_bool),
553
+ ("imatrix", c_void_p),
525
554
  ]
526
555
 
527
556
 
@@ -1933,14 +1962,39 @@ _lib.llama_sample_repetition_penalties.restype = None
1933
1962
 
1934
1963
 
1935
1964
  # /// @details Apply classifier-free guidance to the logits as described in academic paper "Stay on topic with Classifier-Free Guidance" https://arxiv.org/abs/2306.17806
1936
- # /// @param candidates A vector of `llama_token_data` containing the candidate tokens, the logits must be directly extracted from the original generation context without being sorted.
1937
- # /// @params guidance_ctx A separate context from the same model. Other than a negative prompt at the beginning, it should have all generated and user input tokens copied from the main context.
1938
- # /// @params scale Guidance strength. 1.0f means no guidance. Higher values mean stronger guidance.
1939
- # LLAMA_API void llama_sample_classifier_free_guidance(
1940
- # struct llama_context * ctx,
1965
+ # /// @param logits Logits extracted from the original generation context.
1966
+ # /// @param logits_guidance Logits extracted from a separate context from the same model. Other than a negative prompt at the beginning, it should have all generated and user input tokens copied from the main context.
1967
+ # /// @param scale Guidance strength. 1.0f means no guidance. Higher values mean stronger guidance.
1968
+ # LLAMA_API void llama_sample_apply_guidance(
1969
+ # struct llama_context * ctx,
1970
+ # float * logits,
1971
+ # float * logits_guidance,
1972
+ # float scale);
1973
+ def llama_sample_apply_guidance(
1974
+ ctx: llama_context_p,
1975
+ logits, # type: _Pointer[c_float]
1976
+ logits_guidance, # type: _Pointer[c_float]
1977
+ scale: Union[c_float, float],
1978
+ ):
1979
+ """Apply classifier-free guidance to the logits as described in academic paper "Stay on topic with Classifier-Free Guidance" https://arxiv.org/abs/2306.17806"""
1980
+ return _lib.llama_sample_apply_guidance(ctx, logits, logits_guidance, scale)
1981
+
1982
+
1983
+ _lib.llama_sample_apply_guidance.argtypes = [
1984
+ llama_context_p,
1985
+ c_float_p,
1986
+ c_float_p,
1987
+ c_float,
1988
+ ]
1989
+ _lib.llama_sample_apply_guidance.restype = None
1990
+
1991
+
1992
+ # LLAMA_API DEPRECATED(void llama_sample_classifier_free_guidance(
1993
+ # struct llama_context * ctx,
1941
1994
  # llama_token_data_array * candidates,
1942
- # struct llama_context * guidance_ctx,
1943
- # float scale);
1995
+ # struct llama_context * guidance_ctx,
1996
+ # float scale),
1997
+ # "use llama_sample_apply_guidance() instead");
1944
1998
  def llama_sample_classifier_free_guidance(
1945
1999
  ctx: llama_context_p,
1946
2000
  candidates, # type: _Pointer[llama_token_data_array]
@@ -1433,7 +1433,6 @@ class SchemaConverter:
1433
1433
 
1434
1434
  def visit(self, schema: Dict[str, Any], name: str) -> str:
1435
1435
  schema_type: Optional[str] = schema.get("type") # type: ignore
1436
- assert isinstance(schema_type, str), f"Unrecognized schema: {schema}"
1437
1436
  rule_name = name or "root"
1438
1437
 
1439
1438
  if "$defs" in schema: