llama-cpp-python 0.2.34__tar.gz → 0.2.36__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- llama_cpp_python-0.2.36/.git/FETCH_HEAD +1 -0
- llama_cpp_python-0.2.36/.git/HEAD +1 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/config +1 -1
- llama_cpp_python-0.2.36/.git/index +0 -0
- llama_cpp_python-0.2.36/.git/logs/HEAD +1 -0
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/HEAD +1 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/config +1 -1
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/index +0 -0
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/logs/HEAD +2 -0
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/logs/refs/heads/master +1 -0
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/logs/refs/remotes/origin/HEAD +1 -0
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/objects/pack/pack-45c5d7da4d130e32bb1f98f3b58ea9cd2784fad3.idx +0 -0
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/objects/pack/pack-1ad8805aff0ba166c9097b7c2bd8caee41b57147.pack → llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/objects/pack/pack-45c5d7da4d130e32bb1f98f3b58ea9cd2784fad3.pack +0 -0
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/objects/pack/pack-45c5d7da4d130e32bb1f98f3b58ea9cd2784fad3.rev +0 -0
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/packed-refs +2 -0
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/refs/heads/master +1 -0
- llama_cpp_python-0.2.36/.git/modules/vendor/llama.cpp/shallow +1 -0
- llama_cpp_python-0.2.34/.git/objects/6c/7c6db7f0dc20814bf39cba40760e9c468ee61d → llama_cpp_python-0.2.36/.git/objects/03/667ba9b14656308c89e62f61377b295604a99d +0 -0
- llama_cpp_python-0.2.36/.git/objects/46/4af5b39fea3cf1ba16e755a9df85f09bbb25ac +3 -0
- llama_cpp_python-0.2.36/.git/objects/54/66de3a4e33002429b33db9668367bb32af67eb +0 -0
- llama_cpp_python-0.2.36/.git/objects/7a/bb04aa9c0f718d18a085923cdb87a670cb5437 +0 -0
- llama_cpp_python-0.2.36/.git/objects/80/6b120c5e62a7be5fecc631e341d1856dac79a5 +2 -0
- llama_cpp_python-0.2.36/.git/objects/c1/0aee42e0da547428df7cac9845e246badf1803 +0 -0
- llama_cpp_python-0.2.36/.git/objects/e9/9dd1767bb3a30508e8a0de0e41bd426c13c387 +0 -0
- llama_cpp_python-0.2.36/.git/objects/f6/66a05325305ef8813f914ad5b909541bc8f786 +0 -0
- llama_cpp_python-0.2.36/.git/objects/f7/3f3d42f48aa84ceb664f490290d1840f6873e6 +0 -0
- llama_cpp_python-0.2.36/.git/objects/f7/9baa89ba3d84bc4b49e8ed314c018b9e4d4bbc +0 -0
- llama_cpp_python-0.2.36/.git/objects/fa/f4a87a2e4515dbf0dbea0cc64f91fc7b81b8bb +0 -0
- llama_cpp_python-0.2.36/.git/refs/tags/v0.2.36 +1 -0
- llama_cpp_python-0.2.36/.git/shallow +1 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/CHANGELOG.md +9 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/Makefile +3 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/PKG-INFO +54 -1
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/README.md +53 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/__init__.py +1 -1
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/llama_chat_format.py +18 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/tests/test_llama_chat_format.py +23 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/.devops/server-cuda.Dockerfile +32 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/.devops/server-intel.Dockerfile +25 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/.devops/server-rocm.Dockerfile +45 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/.devops/server.Dockerfile +20 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/build.yml +41 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/docker.yml +4 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/CMakeLists.txt +66 -6
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/Makefile +13 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/README.md +25 -3
- llama_cpp_python-0.2.36/vendor/llama.cpp/README_sycl.md +252 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ci/README.md +4 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ci/run.sh +11 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/build-info.cpp +1 -1
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/common.cpp +15 -11
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/convert-hf-to-gguf.py +81 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/convert.py +4 -1
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/CMakeLists.txt +3 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama-bench/llama-bench.cpp +8 -3
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/README.md +8 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/oai.hpp +15 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/server.cpp +63 -3
- llama_cpp_python-0.2.36/vendor/llama.cpp/examples/sycl/CMakeLists.txt +9 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/examples/sycl/README.md +47 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/examples/sycl/build.sh +20 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/examples/sycl/ls-sycl-device.cpp +11 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/examples/sycl/run-llama2.sh +19 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/flake.lock +3 -3
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-alloc.c +82 -24
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-backend-impl.h +6 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-backend.c +107 -2
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-backend.h +3 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-cuda.cu +3 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-metal.m +24 -20
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-opencl.cpp +11 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/ggml-sycl.cpp +15199 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/ggml-sycl.h +27 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/ggml-vulkan-shaders.hpp +61420 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/ggml-vulkan.cpp +5176 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/ggml-vulkan.h +34 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml.c +61 -4
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml.h +2 -0
- llama_cpp_python-0.2.36/vendor/llama.cpp/ggml_vk_generate_shaders.py +2362 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/gguf/constants.py +23 -1
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/llama.cpp +274 -12
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/llama.h +4 -1
- llama_cpp_python-0.2.36/vendor/llama.cpp/scripts/sync-ggml.last +1 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-backend-ops.cpp +8 -1
- llama_cpp_python-0.2.36/vendor/llama.cpp/tests/test-sampling.cpp +299 -0
- llama_cpp_python-0.2.34/.git/FETCH_HEAD +0 -1
- llama_cpp_python-0.2.34/.git/HEAD +0 -1
- llama_cpp_python-0.2.34/.git/index +0 -0
- llama_cpp_python-0.2.34/.git/logs/HEAD +0 -1
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/HEAD +0 -1
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/index +0 -0
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/logs/HEAD +0 -2
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/logs/refs/heads/master +0 -1
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/logs/refs/remotes/origin/HEAD +0 -1
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/objects/pack/pack-1ad8805aff0ba166c9097b7c2bd8caee41b57147.idx +0 -0
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/objects/pack/pack-1ad8805aff0ba166c9097b7c2bd8caee41b57147.rev +0 -0
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/packed-refs +0 -2
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/refs/heads/master +0 -1
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/refs/tags/b1988 +0 -1
- llama_cpp_python-0.2.34/.git/modules/vendor/llama.cpp/shallow +0 -1
- llama_cpp_python-0.2.34/.git/objects/1e/f18d9279e29c56c7eddc91aaf1acc0fac083e2 +0 -0
- llama_cpp_python-0.2.34/.git/objects/36/eacabdc4468738fdfc6534cbc1cf3fafe70ef3 +0 -0
- llama_cpp_python-0.2.34/.git/objects/5e/d3fa262bcd21936a7599d948af876c11807d1d +0 -0
- llama_cpp_python-0.2.34/.git/objects/78/13c96b0a30986613f544ea2983b9d65d64ef01 +0 -0
- llama_cpp_python-0.2.34/.git/objects/9b/9876b88067c66830cc8181d699b5c1a65c3394 +0 -0
- llama_cpp_python-0.2.34/.git/objects/a9/d09e96d4e4906da5bef8870e1c366a87aaa8f4 +0 -0
- llama_cpp_python-0.2.34/.git/objects/af/ebe4ecadc7030a02e412fe0cf8476d5b261266 +0 -0
- llama_cpp_python-0.2.34/.git/objects/c1/d0fff8a990b1e3ebede2f2abf0f6350b2c30a3 +0 -0
- llama_cpp_python-0.2.34/.git/objects/dd/f1d0d6d092eb4d209ec861de65b37eccd5a685 +0 -0
- llama_cpp_python-0.2.34/.git/objects/e4/18d40bc9300928be896c4381d9b08372417c83 +0 -0
- llama_cpp_python-0.2.34/.git/refs/tags/v0.2.34 +0 -1
- llama_cpp_python-0.2.34/.git/shallow +0 -1
- llama_cpp_python-0.2.34/vendor/llama.cpp/scripts/sync-ggml.last +0 -1
- llama_cpp_python-0.2.34/vendor/llama.cpp/tests/test-sampling.cpp +0 -160
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.dockerignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/description +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/applypatch-msg.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/commit-msg.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/fsmonitor-watchman.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/post-update.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/pre-applypatch.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/pre-commit.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/pre-merge-commit.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/pre-push.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/pre-rebase.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/pre-receive.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/prepare-commit-msg.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/push-to-checkout.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/sendemail-validate.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/hooks/update.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/info/exclude +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/description +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/applypatch-msg.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/commit-msg.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/fsmonitor-watchman.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/post-update.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/pre-applypatch.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/pre-commit.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/pre-merge-commit.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/pre-push.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/pre-rebase.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/pre-receive.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/prepare-commit-msg.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/push-to-checkout.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/sendemail-validate.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/hooks/update.sample +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/info/exclude +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/modules/vendor/llama.cpp/refs/remotes/origin/HEAD +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/02/c09afb0bf5559d3fe64ce67f4ff82af32ff50f +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/04/5856ea2ffe697ec33db1c1c989bd45cde5bb3d +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/04/7bc14424303575f73af90611fec827334f54e8 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/0d/870969f4b23bd92a09ec29134d3fb454d38bec +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/0e/2a907c0e40de1a432ee0cd2e3d01c634df1a37 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/11/2a0f7872fa9244bf38729a2722dc5c08dec20c +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/11/b6d5c26e3f7157658952b8ec353e985d522fac +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/13/c5b6b0df5f67e80cbe584909b83777901265a1 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/19/9bd4ffbf88c68c98b52c05f388dfa92716f6b7 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/1a/5152530cfbde487c928b60269a29fa5219f617 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/23/e37d4d40e5ec0bfd85b5e928834d58e2cf0da6 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/24/04228325d88c59b819acaedb20b15635f75df9 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/27/2e4767b47397d1529e6a2d01298144d9d746ba +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/27/a6b1e5042318f85dc99c9f24f4dd6fc472d242 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/29/03e0146d304bcacbfabfe71f171a2edc03043e +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/2c/c6fb02dcb3226c1ecf0fbed6453eb3acadeaa2 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/36/8022c457f6dd5bb566f7e2a21d88850bd98768 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/39/697bfc2538bd4558018d0d721d6d6028c4bb56 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/3a/1d7180d508818fe957923e00dcd8950938632d +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/3a/6457dcdfd47e764654bacae0ba8347976b645a +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/3d/d00767671c5e9dac5a2ab8f4f1331531294b60 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/41/3097201ac0fc27ef4dcf518b699a6fb610a54c +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/41/cc68ea2402cf682807649d841e7c0f4175db01 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/47/4503fdfc554d8caabee4f321a80427f8c7d696 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/4a/106470b0b650cd76f2f5d00d744b615c72bed3 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/4b/3189dd1a54be3bc416786ddf184dd047dc4b20 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/51/f357200f8b998031f4be924e11ed2ae4bf3fea +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/56/2410fe1a4c4093d62e1705933eaf66c6d99a2c +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/5f/350ffe99abe7297b2839f36fd0eaeb98887805 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/60/bc7aef42aac0409cfdca666ad2ff6f516d7b5b +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/61/027ef99725c50b0891fdbf0bf263a33abe648f +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/68/7316b327ca038d26a338b3070a7d4698322515 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/74/739cbdeccf282532e1684caac6846aab3a7afe +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/74/7c6130e3cb1479d20e2013b1dd3db3379c2266 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/76/e26fbd106895fba52861f8ac1e11cc6ee2a307 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/79/5dad726ae91f330c56e49bc188080b5b3b5ba9 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/79/a9e67a1aee09c6d182f240ba5eef32feabcbce +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/7a/7b899ec7dd48d192cba14ac9c8e9df4233f7fb +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/7d/5498f9d2c49c1f731b47845d845f6c5e16a3d9 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/7d/6c970483161eaf43cfa9d50010c071d4953053 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/7e/df0975dc12ccc95ad14de085f07efe6d65c620 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/7e/e8f748eab47180cea09c0ad8e75c3b991b4af4 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/80/7b0f57a8a873e58ade0ff0f5b0bcf0ff66b7f9 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/82/e5c4487e57d6d59c901a73bdd2a9bc172fee7c +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/8b/d03f88a1895cbf3ef249e13df79ee0efda779d +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/91/abb11fdf507883caeeb2d2958e1c65fb6cbdc1 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/99/32d6130f5552a9b85c8b15b4ac6bc26b1068ce +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/9d/0ec2f705618e591cfa8d6512cb9a96b3da75f1 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/9d/3d3559849603efda6f3c8181684e4d19e0ec79 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/9e/9870a52245d4f245df5a4e1b89fda121d78214 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/9f/0dc8a73c5bd91cea7580e9ea733f33528162db +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/a4/5e5d77363eb85144d4aff1a3cbe86ce94d5c92 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/a9/e51cdc1672134ec9af66c9eccf09f6da4ceccd +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/ac/82b8fbb81087ec9b3a72d9e377102a31b28d16 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/ac/aabd74d800e2a957097d56acd931e72129e7f0 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/b1/f90b91594f496ad9f27b1a68584984f4b523d2 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/b9/1632f5bc787c1404600c894a6a4126359747d8 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/bb/b68069d5f8125d64af0baffbd4695f1a0f729c +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/bb/cbbe7d61558adde3cbfd0c7a63a67c27ed6d30 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/c3/deba87b41117da6624f6d92a016ce50239dfc3 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/c4/256dd4ce7908b76e2215415b9bba7911a8deee +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/c8/5e73d2b657bb05ed99309615d67bac93d9f86e +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/ca/ebbb67fdb02a0a8897d4e4826ea046a9931f6f +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/cb/221880a66e3c1f2ca15a9df52ac4bcb765e7d4 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/cc/6a3a7252ea6e698614f0629d4bc040ab6ca717 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/cd/351ba33849dcf6af35b493f7405962fa1625d4 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/d1/ae9b564d3ab02c6b91162e52d822d36524edb3 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/d3/329eec3bac6ce7e54c76b77ac9bf99fab0fe3f +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/d3/efb3a6fe1e001db62ec08e5d31ce1d08567045 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/d8/ef563c2dc69fe1ea223be7bc5b0efc27ad1f9c +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/da/c33b74dddf06fcfc01244044eebb102cfcea37 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/e2/13518b95011cb6ee783986624c3b6de8659f81 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/e4/1f375774e6945e445bfb179502b128fe22dda7 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/e6/9de29bb2d1d6434b8b29ae775ad8c2e48c5391 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/eb/0fb9662e690d0f9de4632cddd321b3f872a725 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/eb/9a2cfa9167df02f136502af79738c71363abfd +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/ec/47c421648c0a57c37cef86f4c5c435fb3b81ff +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/ef/1b2c0162e8edd321e2b9c1ce375d96f1f1d048 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/f0/827d762e852a21f6406c469300899d5f509b8f +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/f1/b8e9d154231932c4b7b9b59611626764e68632 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/f2/0813765a70679e8a063871c9ef75d75c65ccb6 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/fa/dfc5fb4fe6f5eb6d5d98b62519e374a5202b00 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/fc/25ff5160028dee3570249abc40cd57780bcca9 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/fc/ef8cd800ee8a265b146748d178cb56b5632bf3 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/fd/64c09b37947c97e58903ce570785c657d56722 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/fe/b0ed68d94eac48b844fd587ddfb808649716a1 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.git/objects/ff/3e950cd1110fe552912cea4c268c4023d2b737 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.github/dependabot.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.github/workflows/build-and-release.yaml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.github/workflows/build-docker.yaml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.github/workflows/publish-to-test.yaml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.github/workflows/publish.yaml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.github/workflows/test-pypi.yaml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.github/workflows/test.yaml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.gitignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.gitmodules +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/.readthedocs.yaml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/LICENSE.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/cuda_simple/Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/open_llama/Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/open_llama/build.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/open_llama/hug_model.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/open_llama/start.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/open_llama/start_server.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/openblas_simple/Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/simple/Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docker/simple/run.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docs/api-reference.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docs/changelog.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docs/index.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docs/install/macos.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docs/requirements.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/docs/server.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/high_level_api/fastapi_server.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/high_level_api/high_level_api_embedding.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/high_level_api/high_level_api_inference.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/high_level_api/high_level_api_streaming.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/high_level_api/langchain_custom_llm.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/low_level_api/Chat.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/low_level_api/Miku.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/low_level_api/ReasonAct.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/low_level_api/common.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/low_level_api/low_level_api_chat_cpp.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/low_level_api/low_level_api_llama_cpp.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/low_level_api/quantize.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/low_level_api/readme/low_level_api_llama_cpp.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/low_level_api/util.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/notebooks/Batching.ipynb +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/notebooks/Clients.ipynb +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/notebooks/Functions.ipynb +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/notebooks/Guidance.ipynb +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/notebooks/Multimodal.ipynb +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/examples/notebooks/PerformanceTuning.ipynb +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/_internals.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/_utils.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/llama.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/llama_cache.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/llama_cpp.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/llama_grammar.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/llama_types.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/llava_cpp.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/py.typed +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/server/__init__.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/server/__main__.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/server/app.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/server/cli.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/server/errors.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/server/model.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/server/settings.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/llama_cpp/server/types.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/mkdocs.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/pyproject.toml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/tests/test_grammar.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/tests/test_llama.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.clang-tidy +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/cloud-v-pipeline +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/full-cuda.Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/full-rocm.Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/full.Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/main-cuda.Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/main-intel.Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/main-rocm.Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/main.Dockerfile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/nix/apps.nix +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/nix/devshells.nix +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/nix/jetson-support.nix +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/nix/nixpkgs-instances.nix +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/nix/package.nix +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/nix/scope.nix +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.devops/tools.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.dockerignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.ecrc +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.editorconfig +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.flake8 +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.git +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/ISSUE_TEMPLATE/bug.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/ISSUE_TEMPLATE/enhancement.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/code-coverage.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/editorconfig.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/gguf-publish.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/nix-ci-aarch64.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/nix-ci.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/nix-flake-update.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/nix-publish-flake.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/python-check-requirements.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/python-lint.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/tidy-post.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/tidy-review.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/zig-build.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.gitignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.pre-commit-config.yaml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/LICENSE +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/Package.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/SHA256SUMS +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/awq-py/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/awq-py/awq/apply_awq.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/awq-py/requirements.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/build.zig +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/cmake/FindSIMD.cmake +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/codecov.yml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/base64.hpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/build-info.cpp.in +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/common.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/console.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/console.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/grammar-parser.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/grammar-parser.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/log.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/sampling.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/sampling.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/stb_image.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/train.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/common/train.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/convert-llama-ggml-to-gguf.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/convert-lora-to-ggml.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/convert-persimmon-to-gguf.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/docs/BLIS.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/docs/llama-star/idea-arch.key +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/docs/llama-star/idea-arch.pdf +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/docs/token_generation_performance_tips.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/Miku.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/alpaca.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/baby-llama/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/baby-llama/baby-llama.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/base-translate.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched/batched.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched-bench/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched-bench/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched-bench/batched-bench.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched.swift/.gitignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched.swift/Makefile +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched.swift/Package.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched.swift/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/batched.swift/Sources/main.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/beam-search/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/beam-search/beam-search.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/benchmark/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/benchmark/benchmark-matmult.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/chat-13B.bat +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/chat-13B.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/chat-persistent.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/chat-vicuna.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/chat.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/convert-llama2c-to-ggml.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/embedding/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/embedding/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/embedding/embedding.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/export-lora/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/export-lora/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/export-lora/export-lora.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/finetune/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/finetune/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/finetune/convert-finetune-checkpoint-to-gguf.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/finetune/finetune.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/finetune/finetune.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/gguf/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/gguf/gguf.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/gpt4all.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/imatrix/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/imatrix/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/imatrix/imatrix.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/infill/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/infill/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/infill/infill.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/jeopardy/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/jeopardy/graph.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/jeopardy/jeopardy.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/jeopardy/qasheet.csv +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/jeopardy/questions.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/json-schema-to-grammar.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama-bench/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama-bench/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/.gitignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/.gitignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/build.gradle.kts +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/proguard-rules.pro +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/AndroidManifest.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/cpp/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/cpp/llama-android.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/java/com/example/llama/Downloadable.kt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/java/com/example/llama/Llm.kt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/java/com/example/llama/MainActivity.kt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/java/com/example/llama/MainViewModel.kt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/java/com/example/llama/ui/theme/Color.kt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/java/com/example/llama/ui/theme/Theme.kt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/java/com/example/llama/ui/theme/Type.kt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/drawable/ic_launcher_background.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/drawable/ic_launcher_foreground.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-anydpi/ic_launcher.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-anydpi/ic_launcher_round.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-hdpi/ic_launcher.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-hdpi/ic_launcher_round.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-mdpi/ic_launcher.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-mdpi/ic_launcher_round.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-xhdpi/ic_launcher.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-xhdpi/ic_launcher_round.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-xxhdpi/ic_launcher.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-xxhdpi/ic_launcher_round.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-xxxhdpi/ic_launcher.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/mipmap-xxxhdpi/ic_launcher_round.webp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/values/colors.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/values/strings.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/values/themes.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/xml/backup_rules.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/app/src/main/res/xml/data_extraction_rules.xml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/build.gradle.kts +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/gradle/wrapper/gradle-wrapper.jar +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/gradle/wrapper/gradle-wrapper.properties +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/gradle.properties +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/gradlew +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.android/settings.gradle.kts +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/.gitignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.cpp.swift/LibLlama.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Assets.xcassets/AppIcon.appiconset/Contents.json +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Assets.xcassets/Contents.json +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Models/LlamaState.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/ContentView.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/DownloadButton.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/InputButton.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/LoadCustomButton.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/llama_swiftuiApp.swift +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.pbxproj +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.xcworkspace/contents.xcworkspacedata +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama.vim +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama2-13b.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llama2.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/MobileVLM-README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/android/adb_run.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/android/build_64.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/clip.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/clip.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/convert-image-encoder-to-gguf.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/llava-cli.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/llava-surgery.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/llava.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llava/llava.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/llm.vim +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/lookahead/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/lookahead/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/lookahead/lookahead.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/lookup/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/lookup/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/lookup/lookup.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/main/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/main/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/main/main.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/main-cmake-pkg/.gitignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/main-cmake-pkg/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/main-cmake-pkg/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/make-ggml.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/parallel/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/parallel/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/parallel/parallel.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/passkey/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/passkey/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/passkey/passkey.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/perplexity/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/perplexity/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/perplexity/perplexity.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/pydantic-models-to-grammar-examples.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/pydantic_models_to_grammar.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/quantize/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/quantize/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/quantize/quantize.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/quantize-stats/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/quantize-stats/quantize-stats.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/reason-act.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/save-load-state/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/save-load-state/save-load-state.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/api_like_OAI.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/chat-llama2.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/chat.mjs +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/chat.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/completion.js.hpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/deps.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/httplib.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/index.html.hpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/index.js.hpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/json-schema-to-grammar.mjs.hpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/json.hpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/public/completion.js +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/public/index.html +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/public/index.js +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/public/json-schema-to-grammar.mjs +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server/utils.hpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/server-llama2-13B.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/simple/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/simple/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/simple/simple.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/speculative/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/speculative/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/speculative/speculative.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/tokenize/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/tokenize/tokenize.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/train-text-from-scratch/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/train-text-from-scratch/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/train-text-from-scratch/convert-train-checkpoint-to-gguf.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/examples/train-text-from-scratch/train-text-from-scratch.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/flake.nix +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-alloc.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-cuda.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-impl.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-metal.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-metal.metal +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-mpi.c +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-mpi.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-opencl.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-quants.c +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/ggml-quants.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/LICENSE +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/examples/writer.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/gguf/__init__.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/gguf/gguf.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/gguf/gguf_reader.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/gguf/gguf_writer.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/gguf/py.typed +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/gguf/tensor_mapping.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/gguf/vocab.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/pyproject.toml +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/scripts/__init__.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/scripts/gguf-convert-endian.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/scripts/gguf-dump.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/scripts/gguf-set-metadata.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/gguf-py/tests/test_gguf.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/grammars/README.md +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/grammars/arithmetic.gbnf +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/grammars/c.gbnf +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/grammars/chess.gbnf +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/grammars/japanese.gbnf +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/grammars/json.gbnf +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/grammars/json_arr.gbnf +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/grammars/list.gbnf +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/media/llama-leader.jpeg +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/media/llama0-banner.png +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/media/llama0-logo.png +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/media/llama1-banner.png +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/media/llama1-logo.png +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/mypy.ini +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/pocs/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/pocs/vdot/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/pocs/vdot/q8dot.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/pocs/vdot/vdot.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/LLM-questions.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/alpaca.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/assistant.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/chat-with-baichuan.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/chat-with-bob.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/chat-with-qwen.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/chat-with-vicuna-v0.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/chat-with-vicuna-v1.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/chat.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/dan-modified.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/dan.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/mnemonics.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/parallel-questions.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/prompts/reason-act.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/requirements/requirements-convert-hf-to-gguf.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/requirements/requirements-convert-llama-ggml-to-gguf.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/requirements/requirements-convert-lora-to-ggml.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/requirements/requirements-convert-persimmon-to-gguf.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/requirements/requirements-convert.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/requirements.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/LlamaConfig.cmake.in +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/build-info.cmake +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/build-info.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/check-requirements.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/ci-run.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/compare-llama-bench.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/convert-gg.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/gen-build-info-cpp.cmake +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/get-flags.mk +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/get-hellaswag.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/get-pg.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/get-wikitext-2.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/get-winogrande.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/qnt-all.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/run-all-perf.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/run-all-ppl.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/run-with-preset.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/server-llm.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/sync-ggml-am.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/sync-ggml.sh +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/scripts/verify-checksum-models.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/spm-headers/llama.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/.gitignore +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/get-model.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/get-model.h +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-autorelease.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-c.c +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-double-float.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-grad0.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-grammar-parser.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-llama-grammar.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-model-load-cancel.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-opt.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-quantize-fns.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-quantize-perf.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-rope.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-tokenizer-0-falcon.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-tokenizer-0-falcon.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-tokenizer-0-llama.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-tokenizer-0-llama.py +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-tokenizer-1-bpe.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/tests/test-tokenizer-1-llama.cpp +0 -0
- {llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/unicode.h +0 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
464af5b39fea3cf1ba16e755a9df85f09bbb25ac '464af5b39fea3cf1ba16e755a9df85f09bbb25ac' of https://github.com/abetlen/llama-cpp-python
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
464af5b39fea3cf1ba16e755a9df85f09bbb25ac
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
[gc]
|
|
10
10
|
auto = 0
|
|
11
11
|
[http "https://github.com/"]
|
|
12
|
-
extraheader = AUTHORIZATION: basic
|
|
12
|
+
extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzX1Y2cUFITVRmZ0hoM1VTanhaR2VKRTRhUGxXUHJjRzQwRWhTSg==
|
|
13
13
|
[submodule "vendor/llama.cpp"]
|
|
14
14
|
active = true
|
|
15
15
|
url = https://github.com/ggerganov/llama.cpp.git
|
|
Binary file
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 464af5b39fea3cf1ba16e755a9df85f09bbb25ac runner <runner@fv-az695-903.gmayhch2cacunn5b1cp1zlasod.dx.internal.cloudapp.net> 1706543240 +0000 checkout: moving from master to refs/tags/v0.2.36
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
2aed77eb06a329f0d82bb1c467f4244904d4073f
|
|
@@ -13,7 +13,7 @@
|
|
|
13
13
|
[gc]
|
|
14
14
|
auto = 0
|
|
15
15
|
[http "https://github.com/"]
|
|
16
|
-
extraheader = AUTHORIZATION: basic
|
|
16
|
+
extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzX1Y2cUFITVRmZ0hoM1VTanhaR2VKRTRhUGxXUHJjRzQwRWhTSg==
|
|
17
17
|
[url "https://github.com/"]
|
|
18
18
|
insteadOf = git@github.com:
|
|
19
19
|
insteadOf = org-6826477@github.com:
|
|
Binary file
|
|
@@ -0,0 +1,2 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 2aed77eb06a329f0d82bb1c467f4244904d4073f runner <runner@fv-az695-903.gmayhch2cacunn5b1cp1zlasod.dx.internal.cloudapp.net> 1706543241 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
|
|
2
|
+
2aed77eb06a329f0d82bb1c467f4244904d4073f 2aed77eb06a329f0d82bb1c467f4244904d4073f runner <runner@fv-az695-903.gmayhch2cacunn5b1cp1zlasod.dx.internal.cloudapp.net> 1706543241 +0000 checkout: moving from master to 2aed77eb06a329f0d82bb1c467f4244904d4073f
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 2aed77eb06a329f0d82bb1c467f4244904d4073f runner <runner@fv-az695-903.gmayhch2cacunn5b1cp1zlasod.dx.internal.cloudapp.net> 1706543241 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 2aed77eb06a329f0d82bb1c467f4244904d4073f runner <runner@fv-az695-903.gmayhch2cacunn5b1cp1zlasod.dx.internal.cloudapp.net> 1706543241 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
|
|
Binary file
|
|
Binary file
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
2aed77eb06a329f0d82bb1c467f4244904d4073f
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
2aed77eb06a329f0d82bb1c467f4244904d4073f
|
|
Binary file
|
|
@@ -0,0 +1,2 @@
|
|
|
1
|
+
x�TMo1����r��E����6�F��HU[!�ڀ�wmٻT(��ػҲ������<ϛT�>|���]e8+E�t��݃,\ɔ"��,�Ui�y��4�T�SjEVY'w��z+ډ�k�B�z�S��,ʌ��+�z�R
|
|
2
|
+
��kY@�\),!\�ߗ]|�����T��e\x��%����u I+���w¦� ���egx�fߍ����|Х�$������k���Bk��$�E��D/�x�j��/��dߪ�*٦9�M���(l�8����?~a}r�����h'�gW�-+Z4��xr���ҕ�y���Ű7�Vha������W�����Ҍ���]��
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
464af5b39fea3cf1ba16e755a9df85f09bbb25ac
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
464af5b39fea3cf1ba16e755a9df85f09bbb25ac
|
|
@@ -7,6 +7,15 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
|
|
|
7
7
|
|
|
8
8
|
## [Unreleased]
|
|
9
9
|
|
|
10
|
+
## [0.2.36]
|
|
11
|
+
|
|
12
|
+
- feat: Update llama.cpp to ggerganov/llama.cpp@2aed77eb06a329f0d82bb1c467f4244904d4073f
|
|
13
|
+
- feat: Add mistral instruct chat format as "mistral-instruct" by @Rafaelblsilva in #799
|
|
14
|
+
|
|
15
|
+
## [0.2.35]
|
|
16
|
+
|
|
17
|
+
- feat: Update llama.cpp to ggerganov/llama.cpp@d2f650cb5b04ee2726663e79b47da5efe196ce00
|
|
18
|
+
|
|
10
19
|
## [0.2.34]
|
|
11
20
|
|
|
12
21
|
- feat: Update llama.cpp to ggerganov/llama.cpp@6db2b41a76ee78d5efdd5c3cddd5d7ad3f646855
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: llama_cpp_python
|
|
3
|
-
Version: 0.2.34
|
|
3
|
+
Version: 0.2.36
|
|
4
4
|
Summary: Python bindings for the llama.cpp library
|
|
5
5
|
Author-Email: Andrei Betlen <abetlen@gmail.com>
|
|
6
6
|
License: MIT
|
|
@@ -259,6 +259,59 @@ Note that `chat_format` option must be set for the particular model you are usin
|
|
|
259
259
|
|
|
260
260
|
Chat completion is available through the [`create_chat_completion`](https://llama-cpp-python.readthedocs.io/en/latest/api-reference/#llama_cpp.Llama.create_chat_completion) method of the [`Llama`](https://llama-cpp-python.readthedocs.io/en/latest/api-reference/#llama_cpp.Llama) class.
|
|
261
261
|
|
|
262
|
+
### JSON and JSON Schema Mode
|
|
263
|
+
|
|
264
|
+
If you want to constrain chat responses to only valid JSON or a specific JSON Schema you can use the `response_format` argument to the `create_chat_completion` method.
|
|
265
|
+
|
|
266
|
+
#### JSON Mode
|
|
267
|
+
|
|
268
|
+
The following example will constrain the response to be valid JSON.
|
|
269
|
+
|
|
270
|
+
```python
|
|
271
|
+
>>> from llama_cpp import Llama
|
|
272
|
+
>>> llm = Llama(model_path="path/to/model.gguf", chat_format="chatml")
|
|
273
|
+
>>> llm.create_chat_completion(
|
|
274
|
+
messages=[
|
|
275
|
+
{
|
|
276
|
+
"role": "system",
|
|
277
|
+
"content": "You are a helpful assistant that outputs in JSON.",
|
|
278
|
+
},
|
|
279
|
+
{"role": "user", "content": "Who won the world series in 2020"},
|
|
280
|
+
],
|
|
281
|
+
response_format={
|
|
282
|
+
"type": "json_object",
|
|
283
|
+
},
|
|
284
|
+
temperature=0.7,
|
|
285
|
+
)
|
|
286
|
+
```
|
|
287
|
+
|
|
288
|
+
#### JSON Schema Mode
|
|
289
|
+
|
|
290
|
+
To constrain the response to a specific JSON Schema, you can use the `schema` property of the `response_format` argument.
|
|
291
|
+
|
|
292
|
+
```python
|
|
293
|
+
>>> from llama_cpp import Llama
|
|
294
|
+
>>> llm = Llama(model_path="path/to/model.gguf", chat_format="chatml")
|
|
295
|
+
>>> llm.create_chat_completion(
|
|
296
|
+
messages=[
|
|
297
|
+
{
|
|
298
|
+
"role": "system",
|
|
299
|
+
"content": "You are a helpful assistant that outputs in JSON.",
|
|
300
|
+
},
|
|
301
|
+
{"role": "user", "content": "Who won the world series in 2020"},
|
|
302
|
+
],
|
|
303
|
+
response_format={
|
|
304
|
+
"type": "json_object",
|
|
305
|
+
"schema": {
|
|
306
|
+
"type": "object",
|
|
307
|
+
"properties": {"team_name": {"type": "string"}},
|
|
308
|
+
"required": ["team_name"],
|
|
309
|
+
},
|
|
310
|
+
},
|
|
311
|
+
temperature=0.7,
|
|
312
|
+
)
|
|
313
|
+
```
|
|
314
|
+
|
|
262
315
|
### Function Calling
|
|
263
316
|
|
|
264
317
|
The high-level API also provides a simple interface for function calling.
|
|
@@ -216,6 +216,59 @@ Note that `chat_format` option must be set for the particular model you are usin
|
|
|
216
216
|
|
|
217
217
|
Chat completion is available through the [`create_chat_completion`](https://llama-cpp-python.readthedocs.io/en/latest/api-reference/#llama_cpp.Llama.create_chat_completion) method of the [`Llama`](https://llama-cpp-python.readthedocs.io/en/latest/api-reference/#llama_cpp.Llama) class.
|
|
218
218
|
|
|
219
|
+
### JSON and JSON Schema Mode
|
|
220
|
+
|
|
221
|
+
If you want to constrain chat responses to only valid JSON or a specific JSON Schema you can use the `response_format` argument to the `create_chat_completion` method.
|
|
222
|
+
|
|
223
|
+
#### JSON Mode
|
|
224
|
+
|
|
225
|
+
The following example will constrain the response to be valid JSON.
|
|
226
|
+
|
|
227
|
+
```python
|
|
228
|
+
>>> from llama_cpp import Llama
|
|
229
|
+
>>> llm = Llama(model_path="path/to/model.gguf", chat_format="chatml")
|
|
230
|
+
>>> llm.create_chat_completion(
|
|
231
|
+
messages=[
|
|
232
|
+
{
|
|
233
|
+
"role": "system",
|
|
234
|
+
"content": "You are a helpful assistant that outputs in JSON.",
|
|
235
|
+
},
|
|
236
|
+
{"role": "user", "content": "Who won the world series in 2020"},
|
|
237
|
+
],
|
|
238
|
+
response_format={
|
|
239
|
+
"type": "json_object",
|
|
240
|
+
},
|
|
241
|
+
temperature=0.7,
|
|
242
|
+
)
|
|
243
|
+
```
|
|
244
|
+
|
|
245
|
+
#### JSON Schema Mode
|
|
246
|
+
|
|
247
|
+
To constrain the response to a specific JSON Schema, you can use the `schema` property of the `response_format` argument.
|
|
248
|
+
|
|
249
|
+
```python
|
|
250
|
+
>>> from llama_cpp import Llama
|
|
251
|
+
>>> llm = Llama(model_path="path/to/model.gguf", chat_format="chatml")
|
|
252
|
+
>>> llm.create_chat_completion(
|
|
253
|
+
messages=[
|
|
254
|
+
{
|
|
255
|
+
"role": "system",
|
|
256
|
+
"content": "You are a helpful assistant that outputs in JSON.",
|
|
257
|
+
},
|
|
258
|
+
{"role": "user", "content": "Who won the world series in 2020"},
|
|
259
|
+
],
|
|
260
|
+
response_format={
|
|
261
|
+
"type": "json_object",
|
|
262
|
+
"schema": {
|
|
263
|
+
"type": "object",
|
|
264
|
+
"properties": {"team_name": {"type": "string"}},
|
|
265
|
+
"required": ["team_name"],
|
|
266
|
+
},
|
|
267
|
+
},
|
|
268
|
+
temperature=0.7,
|
|
269
|
+
)
|
|
270
|
+
```
|
|
271
|
+
|
|
219
272
|
### Function Calling
|
|
220
273
|
|
|
221
274
|
The high-level API also provides a simple interface for function calling.
|
|
@@ -877,6 +877,24 @@ def format_chatml(
|
|
|
877
877
|
return ChatFormatterResponse(prompt=_prompt, stop=_sep)
|
|
878
878
|
|
|
879
879
|
|
|
880
|
+
@register_chat_format("mistral-instruct")
|
|
881
|
+
def format_mistral_instruct(
|
|
882
|
+
messages: List[llama_types.ChatCompletionRequestMessage],
|
|
883
|
+
**kwargs: Any,
|
|
884
|
+
) -> ChatFormatterResponse:
|
|
885
|
+
bos = "<s>"
|
|
886
|
+
eos = "</s>"
|
|
887
|
+
stop = eos
|
|
888
|
+
prompt = bos
|
|
889
|
+
for message in messages:
|
|
890
|
+
if message["role"] == "user" and message["content"] is not None and isinstance(message["content"], str):
|
|
891
|
+
prompt += "[INST] " + message["content"]
|
|
892
|
+
elif message["role"] == "assistant" and message["content"] is not None and isinstance(message["content"], str):
|
|
893
|
+
prompt += " [/INST]" + message["content"] + eos
|
|
894
|
+
prompt += " [/INST]"
|
|
895
|
+
return ChatFormatterResponse(prompt=prompt, stop=stop)
|
|
896
|
+
|
|
897
|
+
|
|
880
898
|
@register_chat_format("chatglm3")
|
|
881
899
|
def format_chatglm3(
|
|
882
900
|
messages: List[llama_types.ChatCompletionRequestMessage],
|
|
@@ -1,10 +1,33 @@
|
|
|
1
1
|
import json
|
|
2
2
|
|
|
3
|
+
import jinja2
|
|
4
|
+
|
|
3
5
|
from llama_cpp import (
|
|
4
6
|
ChatCompletionRequestUserMessage,
|
|
5
7
|
)
|
|
8
|
+
import llama_cpp.llama_types as llama_types
|
|
9
|
+
import llama_cpp.llama_chat_format as llama_chat_format
|
|
10
|
+
|
|
6
11
|
from llama_cpp.llama_chat_format import hf_tokenizer_config_to_chat_formatter
|
|
7
12
|
|
|
13
|
+
def test_mistral_instruct():
|
|
14
|
+
chat_template = "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}"
|
|
15
|
+
chat_formatter = jinja2.Template(chat_template)
|
|
16
|
+
messages = [
|
|
17
|
+
llama_types.ChatCompletionRequestUserMessage(role="user", content="Instruction"),
|
|
18
|
+
llama_types.ChatCompletionRequestAssistantMessage(role="assistant", content="Model answer"),
|
|
19
|
+
llama_types.ChatCompletionRequestUserMessage(role="user", content="Follow-up instruction"),
|
|
20
|
+
]
|
|
21
|
+
response = llama_chat_format.format_mistral_instruct(
|
|
22
|
+
messages=messages,
|
|
23
|
+
)
|
|
24
|
+
reference = chat_formatter.render(
|
|
25
|
+
messages=messages,
|
|
26
|
+
bos_token="<s>",
|
|
27
|
+
eos_token="</s>",
|
|
28
|
+
)
|
|
29
|
+
assert response.prompt == reference
|
|
30
|
+
|
|
8
31
|
|
|
9
32
|
mistral_7b_tokenizer_config = """{
|
|
10
33
|
"add_bos_token": true,
|
|
@@ -0,0 +1,32 @@
|
|
|
1
|
+
ARG UBUNTU_VERSION=22.04
|
|
2
|
+
# This needs to generally match the container host's environment.
|
|
3
|
+
ARG CUDA_VERSION=11.7.1
|
|
4
|
+
# Target the CUDA build image
|
|
5
|
+
ARG BASE_CUDA_DEV_CONTAINER=nvidia/cuda:${CUDA_VERSION}-devel-ubuntu${UBUNTU_VERSION}
|
|
6
|
+
# Target the CUDA runtime image
|
|
7
|
+
ARG BASE_CUDA_RUN_CONTAINER=nvidia/cuda:${CUDA_VERSION}-runtime-ubuntu${UBUNTU_VERSION}
|
|
8
|
+
|
|
9
|
+
FROM ${BASE_CUDA_DEV_CONTAINER} as build
|
|
10
|
+
|
|
11
|
+
# Unless otherwise specified, we make a fat build.
|
|
12
|
+
ARG CUDA_DOCKER_ARCH=all
|
|
13
|
+
|
|
14
|
+
RUN apt-get update && \
|
|
15
|
+
apt-get install -y build-essential git
|
|
16
|
+
|
|
17
|
+
WORKDIR /app
|
|
18
|
+
|
|
19
|
+
COPY . .
|
|
20
|
+
|
|
21
|
+
# Set nvcc architecture
|
|
22
|
+
ENV CUDA_DOCKER_ARCH=${CUDA_DOCKER_ARCH}
|
|
23
|
+
# Enable cuBLAS
|
|
24
|
+
ENV LLAMA_CUBLAS=1
|
|
25
|
+
|
|
26
|
+
RUN make
|
|
27
|
+
|
|
28
|
+
FROM ${BASE_CUDA_RUN_CONTAINER} as runtime
|
|
29
|
+
|
|
30
|
+
COPY --from=build /app/server /server
|
|
31
|
+
|
|
32
|
+
ENTRYPOINT [ "/server" ]
|
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
ARG ONEAPI_VERSION=2024.0.1-devel-ubuntu22.04
|
|
2
|
+
ARG UBUNTU_VERSION=22.04
|
|
3
|
+
|
|
4
|
+
FROM intel/hpckit:$ONEAPI_VERSION as build
|
|
5
|
+
|
|
6
|
+
RUN apt-get update && \
|
|
7
|
+
apt-get install -y git
|
|
8
|
+
|
|
9
|
+
WORKDIR /app
|
|
10
|
+
|
|
11
|
+
COPY . .
|
|
12
|
+
|
|
13
|
+
# for some reasons, "-DLLAMA_BLAS=ON -DLLAMA_BLAS_VENDOR=Intel10_64lp -DLLAMA_NATIVE=ON" give worse performance
|
|
14
|
+
RUN mkdir build && \
|
|
15
|
+
cd build && \
|
|
16
|
+
cmake .. -DCMAKE_C_COMPILER=icx -DCMAKE_CXX_COMPILER=icpx && \
|
|
17
|
+
cmake --build . --config Release --target main server
|
|
18
|
+
|
|
19
|
+
FROM ubuntu:$UBUNTU_VERSION as runtime
|
|
20
|
+
|
|
21
|
+
COPY --from=build /app/build/bin/server /server
|
|
22
|
+
|
|
23
|
+
ENV LC_ALL=C.utf8
|
|
24
|
+
|
|
25
|
+
ENTRYPOINT [ "/server" ]
|
|
@@ -0,0 +1,45 @@
|
|
|
1
|
+
ARG UBUNTU_VERSION=22.04
|
|
2
|
+
|
|
3
|
+
# This needs to generally match the container host's environment.
|
|
4
|
+
ARG ROCM_VERSION=5.6
|
|
5
|
+
|
|
6
|
+
# Target the CUDA build image
|
|
7
|
+
ARG BASE_ROCM_DEV_CONTAINER=rocm/dev-ubuntu-${UBUNTU_VERSION}:${ROCM_VERSION}-complete
|
|
8
|
+
|
|
9
|
+
FROM ${BASE_ROCM_DEV_CONTAINER} as build
|
|
10
|
+
|
|
11
|
+
# Unless otherwise specified, we make a fat build.
|
|
12
|
+
# List from https://github.com/ggerganov/llama.cpp/pull/1087#issuecomment-1682807878
|
|
13
|
+
# This is mostly tied to rocBLAS supported archs.
|
|
14
|
+
ARG ROCM_DOCKER_ARCH=\
|
|
15
|
+
gfx803 \
|
|
16
|
+
gfx900 \
|
|
17
|
+
gfx906 \
|
|
18
|
+
gfx908 \
|
|
19
|
+
gfx90a \
|
|
20
|
+
gfx1010 \
|
|
21
|
+
gfx1030 \
|
|
22
|
+
gfx1100 \
|
|
23
|
+
gfx1101 \
|
|
24
|
+
gfx1102
|
|
25
|
+
|
|
26
|
+
COPY requirements.txt requirements.txt
|
|
27
|
+
COPY requirements requirements
|
|
28
|
+
|
|
29
|
+
RUN pip install --upgrade pip setuptools wheel \
|
|
30
|
+
&& pip install -r requirements.txt
|
|
31
|
+
|
|
32
|
+
WORKDIR /app
|
|
33
|
+
|
|
34
|
+
COPY . .
|
|
35
|
+
|
|
36
|
+
# Set nvcc architecture
|
|
37
|
+
ENV GPU_TARGETS=${ROCM_DOCKER_ARCH}
|
|
38
|
+
# Enable ROCm
|
|
39
|
+
ENV LLAMA_HIPBLAS=1
|
|
40
|
+
ENV CC=/opt/rocm/llvm/bin/clang
|
|
41
|
+
ENV CXX=/opt/rocm/llvm/bin/clang++
|
|
42
|
+
|
|
43
|
+
RUN make
|
|
44
|
+
|
|
45
|
+
ENTRYPOINT [ "/app/server" ]
|
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
ARG UBUNTU_VERSION=22.04
|
|
2
|
+
|
|
3
|
+
FROM ubuntu:$UBUNTU_VERSION as build
|
|
4
|
+
|
|
5
|
+
RUN apt-get update && \
|
|
6
|
+
apt-get install -y build-essential git
|
|
7
|
+
|
|
8
|
+
WORKDIR /app
|
|
9
|
+
|
|
10
|
+
COPY . .
|
|
11
|
+
|
|
12
|
+
RUN make
|
|
13
|
+
|
|
14
|
+
FROM ubuntu:$UBUNTU_VERSION as runtime
|
|
15
|
+
|
|
16
|
+
COPY --from=build /app/server /server
|
|
17
|
+
|
|
18
|
+
ENV LC_ALL=C.utf8
|
|
19
|
+
|
|
20
|
+
ENTRYPOINT [ "/server" ]
|
{llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/build.yml
RENAMED
|
@@ -143,6 +143,47 @@ jobs:
|
|
|
143
143
|
cd build
|
|
144
144
|
ctest -L main --verbose
|
|
145
145
|
|
|
146
|
+
ubuntu-22-cmake-sycl:
|
|
147
|
+
runs-on: ubuntu-22.04
|
|
148
|
+
|
|
149
|
+
continue-on-error: true
|
|
150
|
+
|
|
151
|
+
steps:
|
|
152
|
+
- uses: actions/checkout@v2
|
|
153
|
+
|
|
154
|
+
- name: add oneAPI to apt
|
|
155
|
+
shell: bash
|
|
156
|
+
run: |
|
|
157
|
+
cd /tmp
|
|
158
|
+
wget https://apt.repos.intel.com/intel-gpg-keys/GPG-PUB-KEY-INTEL-SW-PRODUCTS.PUB
|
|
159
|
+
sudo apt-key add GPG-PUB-KEY-INTEL-SW-PRODUCTS.PUB
|
|
160
|
+
rm GPG-PUB-KEY-INTEL-SW-PRODUCTS.PUB
|
|
161
|
+
sudo add-apt-repository "deb https://apt.repos.intel.com/oneapi all main"
|
|
162
|
+
|
|
163
|
+
- name: install oneAPI dpcpp compiler
|
|
164
|
+
shell: bash
|
|
165
|
+
run: |
|
|
166
|
+
sudo apt update
|
|
167
|
+
sudo apt install intel-oneapi-compiler-dpcpp-cpp
|
|
168
|
+
|
|
169
|
+
- name: install oneAPI MKL library
|
|
170
|
+
shell: bash
|
|
171
|
+
run: |
|
|
172
|
+
sudo apt install intel-oneapi-mkl-devel
|
|
173
|
+
|
|
174
|
+
- name: Clone
|
|
175
|
+
id: checkout
|
|
176
|
+
uses: actions/checkout@v3
|
|
177
|
+
|
|
178
|
+
- name: Build
|
|
179
|
+
id: cmake_build
|
|
180
|
+
run: |
|
|
181
|
+
source /opt/intel/oneapi/setvars.sh
|
|
182
|
+
mkdir build
|
|
183
|
+
cd build
|
|
184
|
+
cmake -DLLAMA_SYCL=ON -DCMAKE_C_COMPILER=icx -DCMAKE_CXX_COMPILER=icpx ..
|
|
185
|
+
cmake --build . --config Release -j $(nproc)
|
|
186
|
+
|
|
146
187
|
# TODO: build with LLAMA_NO_METAL because test-backend-ops fail on "Apple Paravirtual device" and I don't know
|
|
147
188
|
# how to debug it.
|
|
148
189
|
# ref: https://github.com/ggerganov/llama.cpp/actions/runs/7131777249/job/19420981052#step:5:1124
|
{llama_cpp_python-0.2.34 → llama_cpp_python-0.2.36}/vendor/llama.cpp/.github/workflows/docker.yml
RENAMED
|
@@ -28,14 +28,18 @@ jobs:
|
|
|
28
28
|
config:
|
|
29
29
|
- { tag: "light", dockerfile: ".devops/main.Dockerfile", platforms: "linux/amd64,linux/arm64" }
|
|
30
30
|
- { tag: "full", dockerfile: ".devops/full.Dockerfile", platforms: "linux/amd64,linux/arm64" }
|
|
31
|
+
- { tag: "server", dockerfile: ".devops/server.Dockerfile", platforms: "linux/amd64,linux/arm64" }
|
|
31
32
|
# NOTE(canardletter): The CUDA builds on arm64 are very slow, so I
|
|
32
33
|
# have disabled them for now until the reason why
|
|
33
34
|
# is understood.
|
|
34
35
|
- { tag: "light-cuda", dockerfile: ".devops/main-cuda.Dockerfile", platforms: "linux/amd64" }
|
|
35
36
|
- { tag: "full-cuda", dockerfile: ".devops/full-cuda.Dockerfile", platforms: "linux/amd64" }
|
|
37
|
+
- { tag: "server-cuda", dockerfile: ".devops/server-cuda.Dockerfile", platforms: "linux/amd64" }
|
|
36
38
|
- { tag: "light-rocm", dockerfile: ".devops/main-rocm.Dockerfile", platforms: "linux/amd64,linux/arm64" }
|
|
37
39
|
- { tag: "full-rocm", dockerfile: ".devops/full-rocm.Dockerfile", platforms: "linux/amd64,linux/arm64" }
|
|
40
|
+
- { tag: "server-rocm", dockerfile: ".devops/server-rocm.Dockerfile", platforms: "linux/amd64,linux/arm64" }
|
|
38
41
|
- { tag: "light-intel", dockerfile: ".devops/main-intel.Dockerfile", platforms: "linux/amd64" }
|
|
42
|
+
- { tag: "server-intel", dockerfile: ".devops/server-intel.Dockerfile", platforms: "linux/amd64" }
|
|
39
43
|
steps:
|
|
40
44
|
- name: Check out the repo
|
|
41
45
|
uses: actions/checkout@v3
|