llama-cpp-python 0.2.28__tar.gz → 0.2.29__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- llama_cpp_python-0.2.29/.git/FETCH_HEAD +1 -0
- llama_cpp_python-0.2.29/.git/HEAD +1 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/config +1 -1
- llama_cpp_python-0.2.29/.git/index +0 -0
- llama_cpp_python-0.2.29/.git/logs/HEAD +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/HEAD +1 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/config +1 -1
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/index +0 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/logs/HEAD +2 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/logs/refs/heads/master +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/logs/refs/remotes/origin/HEAD +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/objects/pack/pack-089f43df9dfbcbef5693213d630b739a6bd96e17.idx +0 -0
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/pack/pack-51c0c02c987a3a975ed4edb03bbd1999de104e16.pack → llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/objects/pack/pack-089f43df9dfbcbef5693213d630b739a6bd96e17.pack +0 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/objects/pack/pack-089f43df9dfbcbef5693213d630b739a6bd96e17.rev +0 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/packed-refs +2 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/refs/heads/master +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/refs/tags/b1878 +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/shallow +1 -0
- llama_cpp_python-0.2.29/.git/objects/02/c09afb0bf5559d3fe64ce67f4ff82af32ff50f +0 -0
- llama_cpp_python-0.2.29/.git/objects/03/6b2ddd1f34297fc03f715b82fd66945e9147ea +0 -0
- llama_cpp_python-0.2.29/.git/objects/1a/5152530cfbde487c928b60269a29fa5219f617 +0 -0
- llama_cpp_python-0.2.29/.git/objects/1b/78703a3fcd25c369a170cc7c94ca5a0a0e3baf +0 -0
- llama_cpp_python-0.2.29/.git/objects/4b/11fa83c00a3c04cfb47775ffcd226167d52044 +0 -0
- llama_cpp_python-0.2.29/.git/objects/50/6ab1f7ef5b87b110a38090b844b19b63c5bb8c +0 -0
- llama_cpp_python-0.2.29/.git/objects/65/206bf28d4bcaebea79c68bbd4e526aed5da6b3 +0 -0
- llama_cpp_python-0.2.29/.git/objects/6e/7ace3b7938f7c58a9ef2bf593c13691c03cf45 +0 -0
- llama_cpp_python-0.2.29/.git/objects/90/2a43919c5d79d1d418aee2d1512c2e92e8a00b +0 -0
- llama_cpp_python-0.2.29/.git/objects/9e/8e3cec752c06b0fd8cebdebbc6dcf7cade1a5a +0 -0
- llama_cpp_python-0.2.29/.git/objects/a4/5e5d77363eb85144d4aff1a3cbe86ce94d5c92 +0 -0
- llama_cpp_python-0.2.29/.git/objects/ba/14c5172dd87bbfcee083a5eac8c0511bb0c633 +0 -0
- llama_cpp_python-0.2.29/.git/objects/c0/2e656426ce672792fd20cb55c9616067974520 +0 -0
- llama_cpp_python-0.2.29/.git/objects/c0/748ee14e43d553bccbf402a4ed6c13b563b453 +0 -0
- llama_cpp_python-0.2.29/.git/objects/d1/ae9b564d3ab02c6b91162e52d822d36524edb3 +0 -0
- llama_cpp_python-0.2.29/.git/objects/e4/be9d1c98b789ed81b2d0fbdd28a441f267f489 +0 -0
- llama_cpp_python-0.2.29/.git/objects/ef/9392b7a3d1f6802cef539eea18185eb50c61af +2 -0
- llama_cpp_python-0.2.29/.git/objects/f7/b6ba6b1950c0c0a796d996f980e763bd9641cb +0 -0
- llama_cpp_python-0.2.29/.git/objects/f9/be3237d374ae1fa7e6d7e9587f17636b0a4f35 +0 -0
- llama_cpp_python-0.2.29/.git/refs/tags/v0.2.29 +1 -0
- llama_cpp_python-0.2.29/.git/shallow +1 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/CHANGELOG.md +9 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/PKG-INFO +1 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/common.py +1 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/low_level_api_chat_cpp.py +36 -14
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/__init__.py +1 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/_utils.py +9 -11
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama.py +38 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama_cpp.py +67 -13
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama_grammar.py +0 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/model.py +19 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/settings.py +8 -0
- llama_cpp_python-0.2.29/tests/test_grammar.py +52 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/.github/workflows/nix-ci-aarch64.yml +55 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/nix-ci.yml +0 -41
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/nix-flake-update.yml +1 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.gitignore +1 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/CMakeLists.txt +6 -2
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/Makefile +4 -10
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/Package.swift +1 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/awq-py/README.md +1 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/build-info.cpp +1 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/common.cpp +57 -29
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/common.h +3 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/sampling.cpp +5 -4
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-hf-to-gguf.py +35 -13
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/CMakeLists.txt +1 -3
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched-bench/batched-bench.cpp +3 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/benchmark/benchmark-matmult.cpp +2 -2
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/export-lora/export-lora.cpp +1 -2
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/imatrix/CMakeLists.txt +5 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/imatrix/imatrix.cpp +380 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama-bench/llama-bench.cpp +78 -68
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Models/LlamaState.swift +189 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/ContentView.swift +145 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/DownloadButton.swift +2 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/InputButton.swift +131 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.pbxproj +6 -2
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/clip.cpp +24 -38
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main/main.cpp +11 -2
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/pydantic-models-to-grammar-examples.py +136 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/pydantic_models_to_grammar.py +1151 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize/quantize.cpp +132 -2
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/save-load-state/save-load-state.cpp +10 -11
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/README.md +6 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/server.cpp +241 -122
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-alloc.c +28 -6
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-alloc.h +3 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-backend-impl.h +19 -19
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-backend.c +476 -229
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-backend.h +35 -25
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-cuda.cu +894 -455
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-cuda.h +7 -19
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-impl.h +2 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/ggml-metal.h +64 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-metal.m +612 -776
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-metal.metal +374 -4
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-opencl.cpp +321 -14
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-opencl.h +13 -3
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-quants.c +1681 -27
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-quants.h +21 -2
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml.c +150 -58
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml.h +20 -12
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/constants.py +3 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/tensor_mapping.py +9 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/llama.cpp +1217 -1610
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/llama.h +32 -8
- llama_cpp_python-0.2.29/vendor/llama.cpp/scripts/compare-llama-bench.py +374 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/sync-ggml-am.sh +13 -1
- llama_cpp_python-0.2.29/vendor/llama.cpp/scripts/sync-ggml.last +1 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-backend-ops.cpp +21 -7
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-quantize-fns.cpp +3 -2
- llama_cpp_python-0.2.28/.git/FETCH_HEAD +0 -1
- llama_cpp_python-0.2.28/.git/HEAD +0 -1
- llama_cpp_python-0.2.28/.git/index +0 -0
- llama_cpp_python-0.2.28/.git/logs/HEAD +0 -1
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/FETCH_HEAD +0 -1
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/HEAD +0 -1
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/index +0 -0
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/logs/HEAD +0 -2
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/logs/refs/heads/master +0 -1
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/logs/refs/remotes/origin/HEAD +0 -1
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/3b/a26ebd66b91510725fa32a6180452bf45abf89 +0 -0
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/6e/fb8eb30e7025b168f3fda3ff83b9b386428ad6 +0 -0
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/b2/6b6f72fcaad1b45661afb97e2551ecc2afa075 +0 -0
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/pack/pack-51c0c02c987a3a975ed4edb03bbd1999de104e16.idx +0 -0
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/objects/pack/pack-51c0c02c987a3a975ed4edb03bbd1999de104e16.rev +0 -0
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/packed-refs +0 -2
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/refs/heads/master +0 -1
- llama_cpp_python-0.2.28/.git/modules/vendor/llama.cpp/shallow +0 -2
- llama_cpp_python-0.2.28/.git/objects/0c/3b2e0ef0eaaa91538814c8270822dd01c7b9b1 +0 -0
- llama_cpp_python-0.2.28/.git/objects/0e/f132b07175867c07ad06fa22ca6b95eca67b59 +0 -0
- llama_cpp_python-0.2.28/.git/objects/17/1f357f53b0de535157a2c9b4de04582784ec97 +0 -0
- llama_cpp_python-0.2.28/.git/objects/2e/24903c21db75253911a70039ac5622672db813 +0 -0
- llama_cpp_python-0.2.28/.git/objects/33/234fb5fc258e8c09a9626dbb299419c57cc399 +0 -0
- llama_cpp_python-0.2.28/.git/objects/34/6b4631ebd1f4af85e9988d4a528e00edba6375 +0 -0
- llama_cpp_python-0.2.28/.git/objects/44/b6d4a35d3caf0c65aef0a1c77ff0ab4077d405 +0 -0
- llama_cpp_python-0.2.28/.git/objects/50/61247a14e480ab1962c8ec8e5417557a12affb +0 -0
- llama_cpp_python-0.2.28/.git/objects/55/d08db5f514fb6847938e3d6489b99f737ba6e3 +0 -0
- llama_cpp_python-0.2.28/.git/objects/7c/819b0d699f4d334d8020bbd253d3f3f67b4abc +0 -0
- llama_cpp_python-0.2.28/.git/objects/8a/80063397bf2687cb3f4534710d607a5906c681 +0 -0
- llama_cpp_python-0.2.28/.git/objects/ab/d7b4cde5b5285a44472d8a760b5337c986c47b +0 -0
- llama_cpp_python-0.2.28/.git/objects/af/f397f476fb7773d0e89b0e8913c8b1f97ca3e4 +0 -0
- llama_cpp_python-0.2.28/.git/objects/b9/373b7ac641e6e9c8d8cc64951139205d91d8bc +0 -0
- llama_cpp_python-0.2.28/.git/objects/c8/4fd04498c2fb188ff7c2a59473035fc90eb990 +0 -0
- llama_cpp_python-0.2.28/.git/objects/ca/e7ebb7a833dafcd402a96bea3a9574f74f0ed5 +0 -0
- llama_cpp_python-0.2.28/.git/objects/eb/51c854fd5ee35f477dbdf46ced6f62448b7750 +0 -0
- llama_cpp_python-0.2.28/.git/objects/f0/159663d922a6a693b1f9aee335d8667ae7f39e +0 -0
- llama_cpp_python-0.2.28/.git/objects/f5/39ce179f4af1e6b26a8b64c39b6b13fb78d73e +0 -0
- llama_cpp_python-0.2.28/.git/refs/tags/v0.2.28 +0 -1
- llama_cpp_python-0.2.28/.git/shallow +0 -1
- llama_cpp_python-0.2.28/tests/test_grammar.py +0 -13
- llama_cpp_python-0.2.28/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Models/LlamaState.swift +0 -100
- llama_cpp_python-0.2.28/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/ContentView.swift +0 -138
- llama_cpp_python-0.2.28/vendor/llama.cpp/examples/metal/CMakeLists.txt +0 -4
- llama_cpp_python-0.2.28/vendor/llama.cpp/examples/metal/metal.cpp +0 -103
- llama_cpp_python-0.2.28/vendor/llama.cpp/ggml-metal.h +0 -115
- llama_cpp_python-0.2.28/vendor/llama.cpp/scripts/sync-ggml.last +0 -1
- llama_cpp_python-0.2.28/vendor/llama.cpp/spm-headers/ggml.h +0 -1
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.dockerignore +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/description +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/applypatch-msg.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/commit-msg.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/fsmonitor-watchman.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/post-update.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-applypatch.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-commit.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-merge-commit.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-push.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-rebase.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/pre-receive.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/prepare-commit-msg.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/push-to-checkout.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/sendemail-validate.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/hooks/update.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/info/exclude +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/description +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/applypatch-msg.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/commit-msg.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/fsmonitor-watchman.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/post-update.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-applypatch.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-commit.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-merge-commit.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-push.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-rebase.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-receive.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/prepare-commit-msg.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/push-to-checkout.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/sendemail-validate.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/update.sample +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/info/exclude +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/refs/remotes/origin/HEAD +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/04/5856ea2ffe697ec33db1c1c989bd45cde5bb3d +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/04/7bc14424303575f73af90611fec827334f54e8 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/0d/870969f4b23bd92a09ec29134d3fb454d38bec +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/0e/2a907c0e40de1a432ee0cd2e3d01c634df1a37 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/0e/f7bd4a856ec728adc565133e808628ea5566a1 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/11/2a0f7872fa9244bf38729a2722dc5c08dec20c +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/11/b6d5c26e3f7157658952b8ec353e985d522fac +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/13/c5b6b0df5f67e80cbe584909b83777901265a1 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/19/9bd4ffbf88c68c98b52c05f388dfa92716f6b7 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/23/e37d4d40e5ec0bfd85b5e928834d58e2cf0da6 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/24/04228325d88c59b819acaedb20b15635f75df9 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/27/2e4767b47397d1529e6a2d01298144d9d746ba +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/27/a6b1e5042318f85dc99c9f24f4dd6fc472d242 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/29/03e0146d304bcacbfabfe71f171a2edc03043e +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/2c/c6fb02dcb3226c1ecf0fbed6453eb3acadeaa2 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/39/697bfc2538bd4558018d0d721d6d6028c4bb56 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/3a/1d7180d508818fe957923e00dcd8950938632d +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/3a/6457dcdfd47e764654bacae0ba8347976b645a +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/41/cc68ea2402cf682807649d841e7c0f4175db01 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/47/4503fdfc554d8caabee4f321a80427f8c7d696 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/4b/3189dd1a54be3bc416786ddf184dd047dc4b20 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/51/f357200f8b998031f4be924e11ed2ae4bf3fea +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/56/2410fe1a4c4093d62e1705933eaf66c6d99a2c +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/5b/51e98ce432974ff031367f8937babe755e3d73 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/5f/350ffe99abe7297b2839f36fd0eaeb98887805 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/60/bc7aef42aac0409cfdca666ad2ff6f516d7b5b +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/61/027ef99725c50b0891fdbf0bf263a33abe648f +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/68/7316b327ca038d26a338b3070a7d4698322515 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/74/7c6130e3cb1479d20e2013b1dd3db3379c2266 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/76/e26fbd106895fba52861f8ac1e11cc6ee2a307 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/79/5dad726ae91f330c56e49bc188080b5b3b5ba9 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/79/a9e67a1aee09c6d182f240ba5eef32feabcbce +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7a/7b899ec7dd48d192cba14ac9c8e9df4233f7fb +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7d/5498f9d2c49c1f731b47845d845f6c5e16a3d9 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7d/6c970483161eaf43cfa9d50010c071d4953053 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7e/df0975dc12ccc95ad14de085f07efe6d65c620 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/7e/e8f748eab47180cea09c0ad8e75c3b991b4af4 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/80/7b0f57a8a873e58ade0ff0f5b0bcf0ff66b7f9 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/82/e5c4487e57d6d59c901a73bdd2a9bc172fee7c +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/8b/d03f88a1895cbf3ef249e13df79ee0efda779d +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/8e/32d2c0edce725a47b5845463133919cd766a61 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/91/abb11fdf507883caeeb2d2958e1c65fb6cbdc1 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/99/32d6130f5552a9b85c8b15b4ac6bc26b1068ce +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/9d/0ec2f705618e591cfa8d6512cb9a96b3da75f1 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/9d/3d3559849603efda6f3c8181684e4d19e0ec79 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/a9/e51cdc1672134ec9af66c9eccf09f6da4ceccd +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/ac/82b8fbb81087ec9b3a72d9e377102a31b28d16 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/b1/f90b91594f496ad9f27b1a68584984f4b523d2 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/b2/e879ec4bfb319459dd5357313ef06158c7039f +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/b5/affaa9d6087f3888dd9eedea209bb214b6e135 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/b9/1632f5bc787c1404600c894a6a4126359747d8 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/bb/cbbe7d61558adde3cbfd0c7a63a67c27ed6d30 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/c5/4e4eb5ce2636abd78df46a7616cfe9196a1198 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/c8/5e73d2b657bb05ed99309615d67bac93d9f86e +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/ca/ebbb67fdb02a0a8897d4e4826ea046a9931f6f +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/cc/6a3a7252ea6e698614f0629d4bc040ab6ca717 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/cd/351ba33849dcf6af35b493f7405962fa1625d4 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/d3/329eec3bac6ce7e54c76b77ac9bf99fab0fe3f +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/d3/efb3a6fe1e001db62ec08e5d31ce1d08567045 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/da/c33b74dddf06fcfc01244044eebb102cfcea37 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/e2/13518b95011cb6ee783986624c3b6de8659f81 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/e4/1f375774e6945e445bfb179502b128fe22dda7 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/e6/9de29bb2d1d6434b8b29ae775ad8c2e48c5391 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/e9/30609ff5c479a1d5e12a8f3993582d421a6326 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/eb/0fb9662e690d0f9de4632cddd321b3f872a725 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/eb/9a2cfa9167df02f136502af79738c71363abfd +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/ef/1b2c0162e8edd321e2b9c1ce375d96f1f1d048 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/f0/827d762e852a21f6406c469300899d5f509b8f +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/f1/b8e9d154231932c4b7b9b59611626764e68632 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/f2/0813765a70679e8a063871c9ef75d75c65ccb6 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fa/dfc5fb4fe6f5eb6d5d98b62519e374a5202b00 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fc/25ff5160028dee3570249abc40cd57780bcca9 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fc/ef8cd800ee8a265b146748d178cb56b5632bf3 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fd/64c09b37947c97e58903ce570785c657d56722 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/fe/b0ed68d94eac48b844fd587ddfb808649716a1 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.git/objects/ff/3e950cd1110fe552912cea4c268c4023d2b737 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/dependabot.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/build-and-release.yaml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/build-docker.yaml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/publish-to-test.yaml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/publish.yaml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/test-pypi.yaml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.github/workflows/test.yaml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.gitignore +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.gitmodules +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/.readthedocs.yaml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/LICENSE.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/Makefile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/cuda_simple/Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/build.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/hug_model.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/start.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/open_llama/start_server.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/openblas_simple/Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/simple/Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docker/simple/run.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/api-reference.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/changelog.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/index.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/install/macos.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/requirements.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/docs/server.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/fastapi_server.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/high_level_api_embedding.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/high_level_api_inference.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/high_level_api_streaming.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/high_level_api/langchain_custom_llm.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/Chat.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/Miku.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/ReasonAct.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/low_level_api_llama_cpp.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/quantize.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/readme/low_level_api_llama_cpp.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/util.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Batching.ipynb +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Clients.ipynb +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Functions.ipynb +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Guidance.ipynb +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/Multimodal.ipynb +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/notebooks/PerformanceTuning.ipynb +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama_chat_format.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llama_types.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/llava_cpp.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/py.typed +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/__init__.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/__main__.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/app.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/cli.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/errors.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/llama_cpp/server/types.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/mkdocs.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/pyproject.toml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/tests/test_llama.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.clang-tidy +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/cloud-v-pipeline +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/full-cuda.Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/full-rocm.Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/full.Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/main-cuda.Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/main-rocm.Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/main.Dockerfile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/apps.nix +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/devshells.nix +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/jetson-support.nix +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/nixpkgs-instances.nix +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/package.nix +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/scope.nix +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/tools.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.dockerignore +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.ecrc +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.editorconfig +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.flake8 +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.git +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/ISSUE_TEMPLATE/bug.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/ISSUE_TEMPLATE/enhancement.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/build.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/code-coverage.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/docker.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/editorconfig.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/gguf-publish.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/nix-publish-flake.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/python-check-requirements.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/python-lint.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/tidy-post.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/tidy-review.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/zig-build.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.pre-commit-config.yaml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/LICENSE +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/SHA256SUMS +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/awq-py/awq/apply_awq.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/awq-py/requirements.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/build.zig +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ci/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ci/run.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/cmake/FindSIMD.cmake +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/codecov.yml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/base64.hpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/build-info.cpp.in +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/console.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/console.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/grammar-parser.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/grammar-parser.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/log.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/sampling.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/stb_image.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/train.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/train.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-llama-ggml-to-gguf.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-lora-to-ggml.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-persimmon-to-gguf.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/BLIS.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/llama-star/idea-arch.key +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/llama-star/idea-arch.pdf +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/token_generation_performance_tips.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/Miku.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/alpaca.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/baby-llama/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/baby-llama/baby-llama.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/base-translate.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched/batched.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched-bench/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched-bench/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/.gitignore +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/Makefile +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/Package.swift +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/Sources/main.swift +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/beam-search/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/beam-search/beam-search.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/benchmark/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-13B.bat +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-13B.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-persistent.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-vicuna.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/convert-llama2c-to-ggml.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/embedding/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/embedding/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/embedding/embedding.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/export-lora/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/export-lora/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/convert-finetune-checkpoint-to-gguf.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/finetune.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/finetune.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/gguf/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/gguf/gguf.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/gpt4all.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/infill/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/infill/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/infill/infill.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/graph.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/jeopardy.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/qasheet.csv +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/questions.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/json-schema-to-grammar.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama-bench/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama-bench/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/.gitignore +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.cpp.swift/LibLlama.swift +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Assets.xcassets/AppIcon.appiconset/Contents.json +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Assets.xcassets/Contents.json +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/LoadCustomButton.swift +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/llama_swiftuiApp.swift +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.xcworkspace/contents.xcworkspacedata +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.vim +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama2-13b.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama2.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/clip.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/convert-image-encoder-to-gguf.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava-cli.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava-surgery.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llm.vim +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookahead/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookahead/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookahead/lookahead.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookup/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookup/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookup/lookup.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main-cmake-pkg/.gitignore +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main-cmake-pkg/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main-cmake-pkg/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/make-ggml.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/parallel/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/parallel/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/parallel/parallel.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/passkey/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/passkey/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/passkey/passkey.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/perplexity/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/perplexity/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/perplexity/perplexity.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize-stats/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize-stats/quantize-stats.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/reason-act.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/save-load-state/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/api_like_OAI.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/chat-llama2.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/chat.mjs +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/chat.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/completion.js.hpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/deps.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/httplib.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/index.html.hpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/index.js.hpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/json-schema-to-grammar.mjs.hpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/json.hpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/completion.js +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/index.html +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/index.js +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/json-schema-to-grammar.mjs +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server-llama2-13B.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/simple/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/simple/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/simple/simple.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/speculative/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/speculative/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/speculative/speculative.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/tokenize/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/tokenize/tokenize.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/convert-train-checkpoint-to-gguf.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/train-text-from-scratch.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/flake.lock +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/flake.nix +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-mpi.c +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-mpi.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/LICENSE +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/examples/writer.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/__init__.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/gguf.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/gguf_reader.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/gguf_writer.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/py.typed +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/vocab.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/pyproject.toml +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/__init__.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/gguf-convert-endian.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/gguf-dump.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/gguf-set-metadata.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/tests/test_gguf.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/README.md +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/arithmetic.gbnf +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/c.gbnf +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/chess.gbnf +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/japanese.gbnf +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/json.gbnf +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/json_arr.gbnf +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/list.gbnf +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama-leader.jpeg +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama0-banner.png +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama0-logo.png +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama1-banner.png +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama1-logo.png +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/mypy.ini +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/vdot/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/vdot/q8dot.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/vdot/vdot.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/LLM-questions.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/alpaca.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/assistant.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-baichuan.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-bob.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-qwen.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-vicuna-v0.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-vicuna-v1.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/dan-modified.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/dan.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/mnemonics.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/parallel-questions.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/reason-act.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-hf-to-gguf.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-llama-ggml-to-gguf.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-lora-to-ggml.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-persimmon-to-gguf.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/run_with_preset.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/LlamaConfig.cmake.in +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/build-info.cmake +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/build-info.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/check-requirements.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/convert-gg.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/gen-build-info-cpp.cmake +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/get-flags.mk +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/get-pg.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/get-wikitext-2.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/qnt-all.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/run-all-perf.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/run-all-ppl.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/server-llm.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/sync-ggml.sh +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/verify-checksum-models.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/spm-headers/llama.h +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-c.c +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-double-float.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-grad0.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-grammar-parser.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-llama-grammar.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-opt.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-quantize-perf.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-rope.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-sampling.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-falcon.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-falcon.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-llama.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-llama.py +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-1-bpe.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-1-llama.cpp +0 -0
- {llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/vendor/llama.cpp/unicode.h +0 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4b11fa83c00a3c04cfb47775ffcd226167d52044 '4b11fa83c00a3c04cfb47775ffcd226167d52044' of https://github.com/abetlen/llama-cpp-python
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4b11fa83c00a3c04cfb47775ffcd226167d52044
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
[gc]
|
|
10
10
|
auto = 0
|
|
11
11
|
[http "https://github.com/"]
|
|
12
|
-
extraheader = AUTHORIZATION: basic
|
|
12
|
+
extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzXzg0QXZkVFUxdjRsWmlJSlFjZHVISHVlZnBtUnA3STFDcUxkeA==
|
|
13
13
|
[submodule "vendor/llama.cpp"]
|
|
14
14
|
active = true
|
|
15
15
|
url = https://github.com/ggerganov/llama.cpp.git
|
|
Binary file
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 4b11fa83c00a3c04cfb47775ffcd226167d52044 runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341384 +0000 checkout: moving from master to refs/tags/v0.2.29
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -13,7 +13,7 @@
|
|
|
13
13
|
[gc]
|
|
14
14
|
auto = 0
|
|
15
15
|
[http "https://github.com/"]
|
|
16
|
-
extraheader = AUTHORIZATION: basic
|
|
16
|
+
extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzXzg0QXZkVFUxdjRsWmlJSlFjZHVISHVlZnBtUnA3STFDcUxkeA==
|
|
17
17
|
[url "https://github.com/"]
|
|
18
18
|
insteadOf = git@github.com:
|
|
19
19
|
insteadOf = org-6826477@github.com:
|
|
Binary file
|
|
@@ -0,0 +1,2 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
|
|
2
|
+
4483396751c79dea540808b9cb9238245d06da2b 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 checkout: moving from master to 4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
|
|
Binary file
|
|
Binary file
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -0,0 +1,2 @@
|
|
|
1
|
+
x}TM��0�Y�bPj��%�[ ��K�S��R�lM-��J����w4�Xg7�A���潑�u5���w�띏ж�SU��b,<g��� �-�=l6�)��N#o��d&�k�#s)�s��"���1���U�)_������,��g���Ζ�O��ǁS,9�^�4R��]T��l���& D�#�*c5�J��[�ɐ �0�gq�q4�����Z�h�)�(EO��o�@0Ny�~���1MK9����8��W06.q��JK�z �%AZ���戝��y��wV���!R;�R�mU�g,Xz����#�2jN֥8������Dճ3�Q{�i��<�&��{�,��5 r�(���M�˽w=��A�H�P2��"�d)�A�s�����~�4�#=�<�eM����d��V`���'
|
|
2
|
+
.�����-����3��O9V<��R.�����n~1����L����_�H���y�W9/�{9ݕ�_��i����ҺЧ��P��A�Յ�����/]�X%
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4b11fa83c00a3c04cfb47775ffcd226167d52044
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4b11fa83c00a3c04cfb47775ffcd226167d52044
|
|
@@ -7,6 +7,15 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
|
|
|
7
7
|
|
|
8
8
|
## [Unreleased]
|
|
9
9
|
|
|
10
|
+
## [0.2.29]
|
|
11
|
+
|
|
12
|
+
- feat: Update llama.cpp to ggerganov/llama.cpp@4483396751c79dea540808b9cb9238245d06da2b
|
|
13
|
+
- feat: Add split_mode option by @abetlen in 84615adbc6855c8384807c42f0130f9a1763f99d
|
|
14
|
+
- feat: Implement GGUF metadata KV overrides by @phiharri in #1011
|
|
15
|
+
- fix: Avoid "LookupError: unknown encoding: ascii" when open() called in a destructor by @yieldthought in #1012
|
|
16
|
+
- fix: Fix low_level_api_chat_cpp example to match current API by @aniljava in #1086
|
|
17
|
+
- fix: Fix Pydantic model parsing by @DeNeutoy in #1087
|
|
18
|
+
|
|
10
19
|
## [0.2.28]
|
|
11
20
|
|
|
12
21
|
- feat: Update llama.cpp to ggerganov/llama.cpp@6efb8eb30e7025b168f3fda3ff83b9b386428ad6
|
|
@@ -106,7 +106,7 @@ def gpt_params_parse(argv = None):
|
|
|
106
106
|
parser.add_argument("--mirostat_lr", type=float, default=0.1, help="Mirostat learning rate, parameter eta",dest="mirostat_eta")
|
|
107
107
|
|
|
108
108
|
parser.add_argument("-m", "--model", type=str, default="./models/llama-7B/ggml-model.bin", help="model path",dest="model")
|
|
109
|
-
parser.add_argument("-p", "--prompt", type=str, default=
|
|
109
|
+
parser.add_argument("-p", "--prompt", type=str, default=None, help="initial prompt",dest="prompt")
|
|
110
110
|
parser.add_argument("-f", "--file", type=str, default=None, help="file containing initial prompt to load",dest="file")
|
|
111
111
|
parser.add_argument("--session", type=str, default=None, help="file to cache model state in (may be large!)",dest="path_session")
|
|
112
112
|
parser.add_argument("--in-prefix", type=str, default="", help="string to prefix user inputs with", dest="input_prefix")
|
{llama_cpp_python-0.2.28 → llama_cpp_python-0.2.29}/examples/low_level_api/low_level_api_chat_cpp.py
RENAMED
|
@@ -62,7 +62,7 @@ specified) expect poor results""", file=sys.stderr)
|
|
|
62
62
|
self.multibyte_fix = []
|
|
63
63
|
|
|
64
64
|
# model load
|
|
65
|
-
self.lparams = llama_cpp.
|
|
65
|
+
self.lparams = llama_cpp.llama_model_default_params()
|
|
66
66
|
self.lparams.n_ctx = self.params.n_ctx
|
|
67
67
|
self.lparams.n_parts = self.params.n_parts
|
|
68
68
|
self.lparams.seed = self.params.seed
|
|
@@ -72,7 +72,11 @@ specified) expect poor results""", file=sys.stderr)
|
|
|
72
72
|
|
|
73
73
|
self.model = llama_cpp.llama_load_model_from_file(
|
|
74
74
|
self.params.model.encode("utf8"), self.lparams)
|
|
75
|
-
|
|
75
|
+
|
|
76
|
+
# Context Params.
|
|
77
|
+
self.cparams = llama_cpp.llama_context_default_params()
|
|
78
|
+
|
|
79
|
+
self.ctx = llama_cpp.llama_new_context_with_model(self.model, self.cparams)
|
|
76
80
|
if (not self.ctx):
|
|
77
81
|
raise RuntimeError(f"error: failed to load model '{self.params.model}'")
|
|
78
82
|
|
|
@@ -244,7 +248,7 @@ n_keep = {self.params.n_keep}
|
|
|
244
248
|
# tokenize a prompt
|
|
245
249
|
def _tokenize(self, prompt, bos=True):
|
|
246
250
|
_arr = (llama_cpp.llama_token * ((len(prompt) + 1) * 4))()
|
|
247
|
-
_n = llama_cpp.llama_tokenize(self.
|
|
251
|
+
_n = llama_cpp.llama_tokenize(self.model, prompt.encode("utf8", errors="ignore"), len(prompt), _arr, len(_arr), bos, False)
|
|
248
252
|
return _arr[:_n]
|
|
249
253
|
|
|
250
254
|
def set_color(self, c):
|
|
@@ -304,7 +308,7 @@ n_keep = {self.params.n_keep}
|
|
|
304
308
|
self.n_past += n_eval"""
|
|
305
309
|
|
|
306
310
|
if (llama_cpp.llama_eval(
|
|
307
|
-
self.ctx, (llama_cpp.llama_token * len(self.embd))(*self.embd), len(self.embd), self.n_past
|
|
311
|
+
self.ctx, (llama_cpp.llama_token * len(self.embd))(*self.embd), len(self.embd), self.n_past
|
|
308
312
|
) != 0):
|
|
309
313
|
raise Exception("Failed to llama_eval!")
|
|
310
314
|
|
|
@@ -332,7 +336,7 @@ n_keep = {self.params.n_keep}
|
|
|
332
336
|
id = 0
|
|
333
337
|
|
|
334
338
|
logits = llama_cpp.llama_get_logits(self.ctx)
|
|
335
|
-
n_vocab = llama_cpp.llama_n_vocab(self.
|
|
339
|
+
n_vocab = llama_cpp.llama_n_vocab(self.model)
|
|
336
340
|
|
|
337
341
|
# Apply params.logit_bias map
|
|
338
342
|
for key, value in self.params.logit_bias.items():
|
|
@@ -349,12 +353,20 @@ n_keep = {self.params.n_keep}
|
|
|
349
353
|
last_n_repeat = min(len(self.last_n_tokens), repeat_last_n, self.n_ctx)
|
|
350
354
|
|
|
351
355
|
_arr = (llama_cpp.llama_token * last_n_repeat)(*self.last_n_tokens[len(self.last_n_tokens) - last_n_repeat:])
|
|
352
|
-
llama_cpp.
|
|
353
|
-
|
|
354
|
-
|
|
355
|
-
|
|
356
|
-
|
|
357
|
-
|
|
356
|
+
llama_cpp.llama_sample_repetition_penalties(
|
|
357
|
+
ctx=self.ctx,
|
|
358
|
+
candidates=candidates_p,
|
|
359
|
+
last_tokens_data = _arr,
|
|
360
|
+
penalty_last_n = last_n_repeat,
|
|
361
|
+
penalty_repeat = llama_cpp.c_float(self.params.repeat_penalty),
|
|
362
|
+
penalty_freq = llama_cpp.c_float(self.params.frequency_penalty),
|
|
363
|
+
penalty_present = llama_cpp.c_float(self.params.presence_penalty),
|
|
364
|
+
)
|
|
365
|
+
|
|
366
|
+
# NOT PRESENT IN CURRENT VERSION ?
|
|
367
|
+
# llama_cpp.llama_sample_frequency_and_presence_penalti(self.ctx, candidates_p,
|
|
368
|
+
# _arr,
|
|
369
|
+
# last_n_repeat, llama_cpp.c_float(self.params.frequency_penalty), llama_cpp.c_float(self.params.presence_penalty))
|
|
358
370
|
|
|
359
371
|
if not self.params.penalize_nl:
|
|
360
372
|
logits[llama_cpp.llama_token_nl()] = nl_logit
|
|
@@ -473,7 +485,7 @@ n_keep = {self.params.n_keep}
|
|
|
473
485
|
def token_to_str(self, token_id: int) -> bytes:
|
|
474
486
|
size = 32
|
|
475
487
|
buffer = (ctypes.c_char * size)()
|
|
476
|
-
n = llama_cpp.
|
|
488
|
+
n = llama_cpp.llama_token_to_piece(
|
|
477
489
|
self.model, llama_cpp.llama_token(token_id), buffer, size)
|
|
478
490
|
assert n <= size
|
|
479
491
|
return bytes(buffer[:n])
|
|
@@ -532,6 +544,9 @@ n_keep = {self.params.n_keep}
|
|
|
532
544
|
print(i,end="",flush=True)
|
|
533
545
|
self.params.input_echo = False
|
|
534
546
|
|
|
547
|
+
# Using string instead of tokens to check for antiprompt,
|
|
548
|
+
# It is more reliable than tokens for interactive mode.
|
|
549
|
+
generated_str = ""
|
|
535
550
|
while self.params.interactive:
|
|
536
551
|
self.set_color(util.CONSOLE_COLOR_USER_INPUT)
|
|
537
552
|
if (self.params.instruct):
|
|
@@ -546,6 +561,10 @@ n_keep = {self.params.n_keep}
|
|
|
546
561
|
try:
|
|
547
562
|
for i in self.output():
|
|
548
563
|
print(i,end="",flush=True)
|
|
564
|
+
generated_str += i
|
|
565
|
+
for ap in self.params.antiprompt:
|
|
566
|
+
if generated_str.endswith(ap):
|
|
567
|
+
raise KeyboardInterrupt
|
|
549
568
|
except KeyboardInterrupt:
|
|
550
569
|
self.set_color(util.CONSOLE_COLOR_DEFAULT)
|
|
551
570
|
if not self.params.instruct:
|
|
@@ -561,7 +580,7 @@ if __name__ == "__main__":
|
|
|
561
580
|
time_now = datetime.now()
|
|
562
581
|
prompt = f"""Text transcript of a never ending dialog, where {USER_NAME} interacts with an AI assistant named {AI_NAME}.
|
|
563
582
|
{AI_NAME} is helpful, kind, honest, friendly, good at writing and never fails to answer {USER_NAME}’s requests immediately and with details and precision.
|
|
564
|
-
|
|
583
|
+
Transcript below contains only the recorded dialog between two, without any annotations like (30 seconds passed...) or (to himself), just what {USER_NAME} and {AI_NAME} say aloud to each other.
|
|
565
584
|
The dialog lasts for years, the entirety of it is shared below. It's 10000 pages long.
|
|
566
585
|
The transcript only includes text, it does not include markup like HTML and Markdown.
|
|
567
586
|
|
|
@@ -575,8 +594,11 @@ The transcript only includes text, it does not include markup like HTML and Mark
|
|
|
575
594
|
{AI_NAME}: A cat is a domestic species of small carnivorous mammal. It is the only domesticated species in the family Felidae.
|
|
576
595
|
{USER_NAME}: Name a color.
|
|
577
596
|
{AI_NAME}: Blue
|
|
578
|
-
{USER_NAME}:"""
|
|
597
|
+
{USER_NAME}: """
|
|
598
|
+
|
|
579
599
|
params = gpt_params_parse()
|
|
600
|
+
if params.prompt is None and params.file is None:
|
|
601
|
+
params.prompt = prompt
|
|
580
602
|
|
|
581
603
|
with LLaMAInteract(params) as m:
|
|
582
604
|
m.interact()
|
|
@@ -1,11 +1,15 @@
|
|
|
1
1
|
import os
|
|
2
2
|
import sys
|
|
3
3
|
|
|
4
|
+
import sys, traceback
|
|
5
|
+
|
|
6
|
+
# Avoid "LookupError: unknown encoding: ascii" when open() called in a destructor
|
|
7
|
+
outnull_file = open(os.devnull, "w")
|
|
8
|
+
errnull_file = open(os.devnull, "w")
|
|
4
9
|
|
|
5
10
|
class suppress_stdout_stderr(object):
|
|
6
11
|
# NOTE: these must be "saved" here to avoid exceptions when using
|
|
7
12
|
# this context manager inside of a __del__ method
|
|
8
|
-
open = open
|
|
9
13
|
sys = sys
|
|
10
14
|
os = os
|
|
11
15
|
|
|
@@ -21,9 +25,6 @@ class suppress_stdout_stderr(object):
|
|
|
21
25
|
if not hasattr(self.sys.stdout, 'fileno') or not hasattr(self.sys.stderr, 'fileno'):
|
|
22
26
|
return self # Return the instance without making changes
|
|
23
27
|
|
|
24
|
-
self.outnull_file = self.open(self.os.devnull, "w")
|
|
25
|
-
self.errnull_file = self.open(self.os.devnull, "w")
|
|
26
|
-
|
|
27
28
|
self.old_stdout_fileno_undup = self.sys.stdout.fileno()
|
|
28
29
|
self.old_stderr_fileno_undup = self.sys.stderr.fileno()
|
|
29
30
|
|
|
@@ -33,11 +34,11 @@ class suppress_stdout_stderr(object):
|
|
|
33
34
|
self.old_stdout = self.sys.stdout
|
|
34
35
|
self.old_stderr = self.sys.stderr
|
|
35
36
|
|
|
36
|
-
self.os.dup2(
|
|
37
|
-
self.os.dup2(
|
|
37
|
+
self.os.dup2(outnull_file.fileno(), self.old_stdout_fileno_undup)
|
|
38
|
+
self.os.dup2(errnull_file.fileno(), self.old_stderr_fileno_undup)
|
|
38
39
|
|
|
39
|
-
self.sys.stdout =
|
|
40
|
-
self.sys.stderr =
|
|
40
|
+
self.sys.stdout = outnull_file
|
|
41
|
+
self.sys.stderr = errnull_file
|
|
41
42
|
return self
|
|
42
43
|
|
|
43
44
|
def __exit__(self, *_):
|
|
@@ -54,6 +55,3 @@ class suppress_stdout_stderr(object):
|
|
|
54
55
|
|
|
55
56
|
self.os.close(self.old_stdout_fileno)
|
|
56
57
|
self.os.close(self.old_stderr_fileno)
|
|
57
|
-
|
|
58
|
-
self.outnull_file.close()
|
|
59
|
-
self.errnull_file.close()
|
|
@@ -730,11 +730,13 @@ class Llama:
|
|
|
730
730
|
*,
|
|
731
731
|
# Model Params
|
|
732
732
|
n_gpu_layers: int = 0,
|
|
733
|
+
split_mode: int = llama_cpp.LLAMA_SPLIT_LAYER,
|
|
733
734
|
main_gpu: int = 0,
|
|
734
735
|
tensor_split: Optional[List[float]] = None,
|
|
735
736
|
vocab_only: bool = False,
|
|
736
737
|
use_mmap: bool = True,
|
|
737
738
|
use_mlock: bool = False,
|
|
739
|
+
kv_overrides: Optional[Dict[str, Union[bool, int, float]]] = None,
|
|
738
740
|
# Context Params
|
|
739
741
|
seed: int = llama_cpp.LLAMA_DEFAULT_SEED,
|
|
740
742
|
n_ctx: int = 512,
|
|
@@ -798,11 +800,13 @@ class Llama:
|
|
|
798
800
|
Args:
|
|
799
801
|
model_path: Path to the model.
|
|
800
802
|
n_gpu_layers: Number of layers to offload to GPU (-ngl). If -1, all layers are offloaded.
|
|
801
|
-
|
|
803
|
+
split_mode: How to split the model across GPUs. See llama_cpp.LLAMA_SPLIT_* for options.
|
|
804
|
+
main_gpu: main_gpu interpretation depends on split_mode: LLAMA_SPLIT_NONE: the GPU that is used for the entire model. LLAMA_SPLIT_ROW: the GPU that is used for small tensors and intermediate results. LLAMA_SPLIT_LAYER: ignored
|
|
802
805
|
tensor_split: How split tensors should be distributed across GPUs. If None, the model is not split.
|
|
803
806
|
vocab_only: Only load the vocabulary no weights.
|
|
804
807
|
use_mmap: Use mmap if possible.
|
|
805
808
|
use_mlock: Force the system to keep the model in RAM.
|
|
809
|
+
kv_overrides: Key-value overrides for the model.
|
|
806
810
|
seed: RNG seed, -1 for random
|
|
807
811
|
n_ctx: Text context, 0 = from model
|
|
808
812
|
n_batch: Prompt processing maximum batch size
|
|
@@ -848,6 +852,7 @@ class Llama:
|
|
|
848
852
|
self.model_params.n_gpu_layers = (
|
|
849
853
|
0x7FFFFFFF if n_gpu_layers == -1 else n_gpu_layers
|
|
850
854
|
) # 0x7FFFFFFF is INT32 max, will be auto set to all layers
|
|
855
|
+
self.model_params.split_mode = split_mode
|
|
851
856
|
self.model_params.main_gpu = main_gpu
|
|
852
857
|
self.tensor_split = tensor_split
|
|
853
858
|
self._c_tensor_split = None
|
|
@@ -866,6 +871,34 @@ class Llama:
|
|
|
866
871
|
self.model_params.use_mmap = use_mmap if lora_path is None else False
|
|
867
872
|
self.model_params.use_mlock = use_mlock
|
|
868
873
|
|
|
874
|
+
self.kv_overrides = kv_overrides
|
|
875
|
+
if kv_overrides is not None:
|
|
876
|
+
n_overrides = len(kv_overrides)
|
|
877
|
+
self._kv_overrides_array = llama_cpp.llama_model_kv_override * (n_overrides + 1)
|
|
878
|
+
self._kv_overrides_array_keys = []
|
|
879
|
+
|
|
880
|
+
for k, v in kv_overrides.items():
|
|
881
|
+
key_buf = ctypes.create_string_buffer(k.encode("utf-8"))
|
|
882
|
+
self._kv_overrides_array_keys.append(key_buf)
|
|
883
|
+
self._kv_overrides_array[i].key = key_buf
|
|
884
|
+
if isinstance(v, int):
|
|
885
|
+
self._kv_overrides_array[i].tag = llama_cpp.LLAMA_KV_OVERRIDE_INT
|
|
886
|
+
self._kv_overrides_array[i].value.int_value = v
|
|
887
|
+
elif isinstance(v, float):
|
|
888
|
+
self._kv_overrides_array[i].tag = llama_cpp.LLAMA_KV_OVERRIDE_FLOAT
|
|
889
|
+
self._kv_overrides_array[i].value.float_value = v
|
|
890
|
+
elif isinstance(v, bool):
|
|
891
|
+
self._kv_overrides_array[i].tag = llama_cpp.LLAMA_KV_OVERRIDE_BOOL
|
|
892
|
+
self._kv_overrides_array[i].value.bool_value = v
|
|
893
|
+
else:
|
|
894
|
+
raise ValueError(f"Unknown value type for {k}: {v}")
|
|
895
|
+
|
|
896
|
+
self._kv_overrides_array_sentinel_key = b'\0'
|
|
897
|
+
|
|
898
|
+
# null array sentinel
|
|
899
|
+
self._kv_overrides_array[n_overrides].key = self._kv_overrides_array_sentinel_key
|
|
900
|
+
self.model_params.kv_overrides = self._kv_overrides_array
|
|
901
|
+
|
|
869
902
|
self.n_batch = min(n_ctx, n_batch) # ???
|
|
870
903
|
self.n_threads = n_threads or max(multiprocessing.cpu_count() // 2, 1)
|
|
871
904
|
self.n_threads_batch = n_threads_batch or max(
|
|
@@ -2143,11 +2176,13 @@ class Llama:
|
|
|
2143
2176
|
model_path=self.model_path,
|
|
2144
2177
|
# Model Params
|
|
2145
2178
|
n_gpu_layers=self.model_params.n_gpu_layers,
|
|
2179
|
+
split_mode=self.model_params.split_mode,
|
|
2146
2180
|
main_gpu=self.model_params.main_gpu,
|
|
2147
2181
|
tensor_split=self.tensor_split,
|
|
2148
2182
|
vocab_only=self.model_params.vocab_only,
|
|
2149
2183
|
use_mmap=self.model_params.use_mmap,
|
|
2150
2184
|
use_mlock=self.model_params.use_mlock,
|
|
2185
|
+
kv_overrides=self.kv_overrides,
|
|
2151
2186
|
# Context Params
|
|
2152
2187
|
seed=self.context_params.seed,
|
|
2153
2188
|
n_ctx=self.context_params.n_ctx,
|
|
@@ -2185,11 +2220,13 @@ class Llama:
|
|
|
2185
2220
|
model_path=state["model_path"],
|
|
2186
2221
|
# Model Params
|
|
2187
2222
|
n_gpu_layers=state["n_gpu_layers"],
|
|
2223
|
+
split_mode=state["split_mode"],
|
|
2188
2224
|
main_gpu=state["main_gpu"],
|
|
2189
2225
|
tensor_split=state["tensor_split"],
|
|
2190
2226
|
vocab_only=state["vocab_only"],
|
|
2191
2227
|
use_mmap=state["use_mmap"],
|
|
2192
2228
|
use_mlock=state["use_mlock"],
|
|
2229
|
+
kv_overrides=state["kv_overrides"],
|
|
2193
2230
|
# Context Params
|
|
2194
2231
|
seed=state["seed"],
|
|
2195
2232
|
n_ctx=state["n_ctx"],
|
|
@@ -112,8 +112,8 @@ LLAMA_FILE_MAGIC_GGSN = 0x6767736E
|
|
|
112
112
|
|
|
113
113
|
# define LLAMA_SESSION_MAGIC LLAMA_FILE_MAGIC_GGSN
|
|
114
114
|
LLAMA_SESSION_MAGIC = LLAMA_FILE_MAGIC_GGSN
|
|
115
|
-
# define LLAMA_SESSION_VERSION
|
|
116
|
-
LLAMA_SESSION_VERSION =
|
|
115
|
+
# define LLAMA_SESSION_VERSION 4
|
|
116
|
+
LLAMA_SESSION_VERSION = 4
|
|
117
117
|
|
|
118
118
|
|
|
119
119
|
# struct llama_model;
|
|
@@ -180,6 +180,8 @@ LLAMA_TOKEN_TYPE_BYTE = 6
|
|
|
180
180
|
# LLAMA_FTYPE_MOSTLY_Q5_K_M = 17, // except 1d tensors
|
|
181
181
|
# LLAMA_FTYPE_MOSTLY_Q6_K = 18, // except 1d tensors
|
|
182
182
|
# LLAMA_FTYPE_MOSTLY_IQ2_XXS = 19, // except 1d tensors
|
|
183
|
+
# LLAMA_FTYPE_MOSTLY_IQ2_XS = 20, // except 1d tensors
|
|
184
|
+
# LLAMA_FTYPE_MOSTLY_Q2_K_S = 21, // except 1d tensors
|
|
183
185
|
|
|
184
186
|
# LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
|
|
185
187
|
# };
|
|
@@ -200,6 +202,9 @@ LLAMA_FTYPE_MOSTLY_Q4_K_M = 15
|
|
|
200
202
|
LLAMA_FTYPE_MOSTLY_Q5_K_S = 16
|
|
201
203
|
LLAMA_FTYPE_MOSTLY_Q5_K_M = 17
|
|
202
204
|
LLAMA_FTYPE_MOSTLY_Q6_K = 18
|
|
205
|
+
LLAMA_FTYPE_MOSTLY_IQ2_XXS = 19
|
|
206
|
+
LLAMA_FTYPE_MOSTLY_IQ2_XS = 20
|
|
207
|
+
LLAMA_FTYPE_MOSTLY_Q2_K_S = 21
|
|
203
208
|
LLAMA_FTYPE_GUESSED = 1024
|
|
204
209
|
|
|
205
210
|
# enum llama_rope_scaling_type {
|
|
@@ -215,6 +220,15 @@ LLAMA_ROPE_SCALING_LINEAR = 1
|
|
|
215
220
|
LLAMA_ROPE_SCALING_YARN = 2
|
|
216
221
|
LLAMA_ROPE_SCALING_MAX_VALUE = LLAMA_ROPE_SCALING_YARN
|
|
217
222
|
|
|
223
|
+
# enum llama_split_mode {
|
|
224
|
+
# LLAMA_SPLIT_NONE = 0, // single GPU
|
|
225
|
+
# LLAMA_SPLIT_LAYER = 1, // split layers and KV across GPUs
|
|
226
|
+
# LLAMA_SPLIT_ROW = 2, // split rows across GPUs
|
|
227
|
+
# };
|
|
228
|
+
LLAMA_SPLIT_NONE = 0
|
|
229
|
+
LLAMA_SPLIT_LAYER = 1
|
|
230
|
+
LLAMA_SPLIT_ROW = 2
|
|
231
|
+
|
|
218
232
|
|
|
219
233
|
# typedef struct llama_token_data {
|
|
220
234
|
# llama_token id; // token id
|
|
@@ -360,13 +374,22 @@ class llama_model_kv_override(Structure):
|
|
|
360
374
|
|
|
361
375
|
# struct llama_model_params {
|
|
362
376
|
# int32_t n_gpu_layers; // number of layers to store in VRAM
|
|
363
|
-
#
|
|
364
|
-
|
|
377
|
+
# enum llama_split_mode split_mode; // how to split the model across multiple GPUs
|
|
378
|
+
|
|
379
|
+
# // main_gpu interpretation depends on split_mode:
|
|
380
|
+
# // LLAMA_SPLIT_NONE: the GPU that is used for the entire model
|
|
381
|
+
# // LLAMA_SPLIT_ROW: the GPU that is used for small tensors and intermediate results
|
|
382
|
+
# // LLAMA_SPLIT_LAYER: ignored
|
|
383
|
+
# int32_t main_gpu;
|
|
384
|
+
|
|
385
|
+
# // proportion of the model (layers or rows) to offload to each GPU, size: LLAMA_MAX_DEVICES
|
|
386
|
+
# const float * tensor_split;
|
|
365
387
|
|
|
366
388
|
# // Called with a progress value between 0.0 and 1.0. Pass NULL to disable.
|
|
367
389
|
# // If the provided progress_callback returns true, model loading continues.
|
|
368
390
|
# // If it returns false, model loading is immediately aborted.
|
|
369
391
|
# llama_progress_callback progress_callback;
|
|
392
|
+
|
|
370
393
|
# // context pointer passed to the progress callback
|
|
371
394
|
# void * progress_callback_user_data;
|
|
372
395
|
|
|
@@ -384,8 +407,9 @@ class llama_model_params(Structure):
|
|
|
384
407
|
|
|
385
408
|
Attributes:
|
|
386
409
|
n_gpu_layers (int): number of layers to store in VRAM
|
|
387
|
-
|
|
388
|
-
|
|
410
|
+
split_mode (int): how to split the model across multiple GPUs
|
|
411
|
+
main_gpu (int): the GPU that is used for the entire model. main_gpu interpretation depends on split_mode: LLAMA_SPLIT_NONE: the GPU that is used for the entire model LLAMA_SPLIT_ROW: the GPU that is used for small tensors and intermediate results LLAMA_SPLIT_LAYER: ignored
|
|
412
|
+
tensor_split (ctypes.Array[ctypes.c_float]): proportion of the model (layers or rows) to offload to each GPU, size: LLAMA_MAX_DEVICES
|
|
389
413
|
progress_callback (llama_progress_callback): called with a progress value between 0.0 and 1.0. Pass NULL to disable. If the provided progress_callback returns true, model loading continues. If it returns false, model loading is immediately aborted.
|
|
390
414
|
progress_callback_user_data (ctypes.c_void_p): context pointer passed to the progress callback
|
|
391
415
|
kv_overrides (ctypes.Array[llama_model_kv_override]): override key-value pairs of the model meta data
|
|
@@ -395,6 +419,7 @@ class llama_model_params(Structure):
|
|
|
395
419
|
|
|
396
420
|
_fields_ = [
|
|
397
421
|
("n_gpu_layers", c_int32),
|
|
422
|
+
("split_mode", c_int),
|
|
398
423
|
("main_gpu", c_int32),
|
|
399
424
|
("tensor_split", c_float_p),
|
|
400
425
|
("progress_callback", llama_progress_callback),
|
|
@@ -503,6 +528,7 @@ It might not exist for progress report where '.' is output repeatedly."""
|
|
|
503
528
|
# bool quantize_output_tensor; // quantize output.weight
|
|
504
529
|
# bool only_copy; // only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
|
|
505
530
|
# bool pure; // disable k-quant mixtures and quantize all tensors to the same type
|
|
531
|
+
# void * imatrix; // pointer to importance matrix data
|
|
506
532
|
# } llama_model_quantize_params;
|
|
507
533
|
class llama_model_quantize_params(Structure):
|
|
508
534
|
"""Parameters for llama_model_quantize
|
|
@@ -514,6 +540,7 @@ class llama_model_quantize_params(Structure):
|
|
|
514
540
|
quantize_output_tensor (bool): quantize output.weight
|
|
515
541
|
only_copy (bool): only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
|
|
516
542
|
pure (bool): disable k-quant mixtures and quantize all tensors to the same type
|
|
543
|
+
imatrix (ctypes.c_void_p): pointer to importance matrix data
|
|
517
544
|
"""
|
|
518
545
|
|
|
519
546
|
_fields_ = [
|
|
@@ -522,6 +549,8 @@ class llama_model_quantize_params(Structure):
|
|
|
522
549
|
("allow_requantize", c_bool),
|
|
523
550
|
("quantize_output_tensor", c_bool),
|
|
524
551
|
("only_copy", c_bool),
|
|
552
|
+
("pure", c_bool),
|
|
553
|
+
("imatrix", c_void_p),
|
|
525
554
|
]
|
|
526
555
|
|
|
527
556
|
|
|
@@ -1933,14 +1962,39 @@ _lib.llama_sample_repetition_penalties.restype = None
|
|
|
1933
1962
|
|
|
1934
1963
|
|
|
1935
1964
|
# /// @details Apply classifier-free guidance to the logits as described in academic paper "Stay on topic with Classifier-Free Guidance" https://arxiv.org/abs/2306.17806
|
|
1936
|
-
# /// @param
|
|
1937
|
-
# /// @
|
|
1938
|
-
# /// @
|
|
1939
|
-
# LLAMA_API void
|
|
1940
|
-
#
|
|
1965
|
+
# /// @param logits Logits extracted from the original generation context.
|
|
1966
|
+
# /// @param logits_guidance Logits extracted from a separate context from the same model. Other than a negative prompt at the beginning, it should have all generated and user input tokens copied from the main context.
|
|
1967
|
+
# /// @param scale Guidance strength. 1.0f means no guidance. Higher values mean stronger guidance.
|
|
1968
|
+
# LLAMA_API void llama_sample_apply_guidance(
|
|
1969
|
+
# struct llama_context * ctx,
|
|
1970
|
+
# float * logits,
|
|
1971
|
+
# float * logits_guidance,
|
|
1972
|
+
# float scale);
|
|
1973
|
+
def llama_sample_apply_guidance(
|
|
1974
|
+
ctx: llama_context_p,
|
|
1975
|
+
logits, # type: _Pointer[c_float]
|
|
1976
|
+
logits_guidance, # type: _Pointer[c_float]
|
|
1977
|
+
scale: Union[c_float, float],
|
|
1978
|
+
):
|
|
1979
|
+
"""Apply classifier-free guidance to the logits as described in academic paper "Stay on topic with Classifier-Free Guidance" https://arxiv.org/abs/2306.17806"""
|
|
1980
|
+
return _lib.llama_sample_apply_guidance(ctx, logits, logits_guidance, scale)
|
|
1981
|
+
|
|
1982
|
+
|
|
1983
|
+
_lib.llama_sample_apply_guidance.argtypes = [
|
|
1984
|
+
llama_context_p,
|
|
1985
|
+
c_float_p,
|
|
1986
|
+
c_float_p,
|
|
1987
|
+
c_float,
|
|
1988
|
+
]
|
|
1989
|
+
_lib.llama_sample_apply_guidance.restype = None
|
|
1990
|
+
|
|
1991
|
+
|
|
1992
|
+
# LLAMA_API DEPRECATED(void llama_sample_classifier_free_guidance(
|
|
1993
|
+
# struct llama_context * ctx,
|
|
1941
1994
|
# llama_token_data_array * candidates,
|
|
1942
|
-
#
|
|
1943
|
-
#
|
|
1995
|
+
# struct llama_context * guidance_ctx,
|
|
1996
|
+
# float scale),
|
|
1997
|
+
# "use llama_sample_apply_guidance() instead");
|
|
1944
1998
|
def llama_sample_classifier_free_guidance(
|
|
1945
1999
|
ctx: llama_context_p,
|
|
1946
2000
|
candidates, # type: _Pointer[llama_token_data_array]
|
|
@@ -1433,7 +1433,6 @@ class SchemaConverter:
|
|
|
1433
1433
|
|
|
1434
1434
|
def visit(self, schema: Dict[str, Any], name: str) -> str:
|
|
1435
1435
|
schema_type: Optional[str] = schema.get("type") # type: ignore
|
|
1436
|
-
assert isinstance(schema_type, str), f"Unrecognized schema: {schema}"
|
|
1437
1436
|
rule_name = name or "root"
|
|
1438
1437
|
|
|
1439
1438
|
if "$defs" in schema:
|