llama-cpp-python 0.2.27__tar.gz → 0.2.29__tar.gz
This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- llama_cpp_python-0.2.29/.git/FETCH_HEAD +1 -0
- llama_cpp_python-0.2.29/.git/HEAD +1 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/config +1 -1
- llama_cpp_python-0.2.29/.git/index +0 -0
- llama_cpp_python-0.2.29/.git/logs/HEAD +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/HEAD +1 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/config +1 -1
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/index +0 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/logs/HEAD +2 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/logs/refs/heads/master +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/logs/refs/remotes/origin/HEAD +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/objects/pack/pack-089f43df9dfbcbef5693213d630b739a6bd96e17.idx +0 -0
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/objects/pack/pack-780603ec965f7335ad2c7f37420dd671ac0b2ca0.pack → llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/objects/pack/pack-089f43df9dfbcbef5693213d630b739a6bd96e17.pack +0 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/objects/pack/pack-089f43df9dfbcbef5693213d630b739a6bd96e17.rev +0 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/packed-refs +2 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/refs/heads/master +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/refs/tags/b1878 +1 -0
- llama_cpp_python-0.2.29/.git/modules/vendor/llama.cpp/shallow +1 -0
- llama_cpp_python-0.2.29/.git/objects/02/c09afb0bf5559d3fe64ce67f4ff82af32ff50f +0 -0
- llama_cpp_python-0.2.29/.git/objects/03/6b2ddd1f34297fc03f715b82fd66945e9147ea +0 -0
- llama_cpp_python-0.2.29/.git/objects/1a/5152530cfbde487c928b60269a29fa5219f617 +0 -0
- llama_cpp_python-0.2.29/.git/objects/1b/78703a3fcd25c369a170cc7c94ca5a0a0e3baf +0 -0
- llama_cpp_python-0.2.29/.git/objects/4b/11fa83c00a3c04cfb47775ffcd226167d52044 +0 -0
- llama_cpp_python-0.2.29/.git/objects/50/6ab1f7ef5b87b110a38090b844b19b63c5bb8c +0 -0
- llama_cpp_python-0.2.29/.git/objects/65/206bf28d4bcaebea79c68bbd4e526aed5da6b3 +0 -0
- llama_cpp_python-0.2.29/.git/objects/6e/7ace3b7938f7c58a9ef2bf593c13691c03cf45 +0 -0
- llama_cpp_python-0.2.29/.git/objects/90/2a43919c5d79d1d418aee2d1512c2e92e8a00b +0 -0
- llama_cpp_python-0.2.29/.git/objects/9e/8e3cec752c06b0fd8cebdebbc6dcf7cade1a5a +0 -0
- llama_cpp_python-0.2.29/.git/objects/a4/5e5d77363eb85144d4aff1a3cbe86ce94d5c92 +0 -0
- llama_cpp_python-0.2.29/.git/objects/ba/14c5172dd87bbfcee083a5eac8c0511bb0c633 +0 -0
- llama_cpp_python-0.2.29/.git/objects/c0/2e656426ce672792fd20cb55c9616067974520 +0 -0
- llama_cpp_python-0.2.29/.git/objects/c0/748ee14e43d553bccbf402a4ed6c13b563b453 +0 -0
- llama_cpp_python-0.2.29/.git/objects/d1/ae9b564d3ab02c6b91162e52d822d36524edb3 +0 -0
- llama_cpp_python-0.2.29/.git/objects/e4/be9d1c98b789ed81b2d0fbdd28a441f267f489 +0 -0
- llama_cpp_python-0.2.29/.git/objects/ef/9392b7a3d1f6802cef539eea18185eb50c61af +2 -0
- llama_cpp_python-0.2.29/.git/objects/f7/b6ba6b1950c0c0a796d996f980e763bd9641cb +0 -0
- llama_cpp_python-0.2.29/.git/objects/f9/be3237d374ae1fa7e6d7e9587f17636b0a4f35 +0 -0
- llama_cpp_python-0.2.29/.git/refs/tags/v0.2.29 +1 -0
- llama_cpp_python-0.2.29/.git/shallow +1 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/CHANGELOG.md +15 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/PKG-INFO +1 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/common.py +1 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/low_level_api_chat_cpp.py +36 -14
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/__init__.py +1 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/_utils.py +9 -11
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/llama.py +40 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/llama_cpp.py +142 -32
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/llama_grammar.py +1 -2
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/server/model.py +19 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/server/settings.py +8 -0
- llama_cpp_python-0.2.29/tests/test_grammar.py +52 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/package.nix +1 -1
- llama_cpp_python-0.2.29/vendor/llama.cpp/.github/workflows/nix-ci-aarch64.yml +55 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/nix-ci.yml +0 -41
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/nix-flake-update.yml +1 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.gitignore +2 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/CMakeLists.txt +17 -7
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/Makefile +7 -10
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/Package.swift +2 -2
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/README.md +3 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/awq-py/README.md +1 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/build-info.cpp +1 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/common.cpp +75 -29
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/common.h +5 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/sampling.cpp +5 -4
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-hf-to-gguf.py +35 -13
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert.py +675 -312
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/CMakeLists.txt +2 -3
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/base-translate.sh +61 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched/batched.cpp +1 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched-bench/batched-bench.cpp +3 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/benchmark/benchmark-matmult.cpp +2 -2
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/export-lora/export-lora.cpp +1 -2
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/imatrix/CMakeLists.txt +5 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/imatrix/imatrix.cpp +380 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama-bench/llama-bench.cpp +104 -66
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/README.md +12 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.cpp.swift/LibLlama.swift +2 -5
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Models/LlamaState.swift +189 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/ContentView.swift +145 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/DownloadButton.swift +2 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/InputButton.swift +131 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.pbxproj +24 -89
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/clip.cpp +24 -38
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava-cli.cpp +3 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main/main.cpp +72 -24
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/passkey/CMakeLists.txt +5 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/passkey/README.md +12 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/passkey/passkey.cpp +296 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/pydantic-models-to-grammar-examples.py +136 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/examples/pydantic_models_to_grammar.py +1151 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize/quantize.cpp +132 -2
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/save-load-state/save-load-state.cpp +10 -11
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/README.md +40 -25
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/server.cpp +252 -126
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-alloc.c +28 -6
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-alloc.h +3 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-backend-impl.h +20 -20
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-backend.c +479 -228
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-backend.h +36 -26
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-cuda.cu +1464 -528
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-cuda.h +7 -19
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-impl.h +2 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/ggml-metal.h +64 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-metal.m +632 -755
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-metal.metal +692 -8
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-opencl.cpp +321 -14
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-opencl.h +13 -3
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-quants.c +1963 -17
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-quants.h +32 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml.c +186 -81
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml.h +22 -11
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/constants.py +3 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/tensor_mapping.py +9 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/llama.cpp +1247 -1609
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/llama.h +44 -8
- llama_cpp_python-0.2.29/vendor/llama.cpp/scripts/compare-llama-bench.py +374 -0
- llama_cpp_python-0.2.29/vendor/llama.cpp/scripts/get-pg.sh +70 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/sync-ggml-am.sh +13 -1
- llama_cpp_python-0.2.29/vendor/llama.cpp/scripts/sync-ggml.last +1 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-backend-ops.cpp +36 -9
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-quantize-fns.cpp +6 -0
- llama_cpp_python-0.2.27/.git/FETCH_HEAD +0 -1
- llama_cpp_python-0.2.27/.git/HEAD +0 -1
- llama_cpp_python-0.2.27/.git/index +0 -0
- llama_cpp_python-0.2.27/.git/logs/HEAD +0 -1
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/HEAD +0 -1
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/index +0 -0
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/logs/HEAD +0 -2
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/logs/refs/heads/master +0 -1
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/logs/refs/remotes/origin/HEAD +0 -1
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/objects/pack/pack-780603ec965f7335ad2c7f37420dd671ac0b2ca0.idx +0 -0
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/objects/pack/pack-780603ec965f7335ad2c7f37420dd671ac0b2ca0.rev +0 -0
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/packed-refs +0 -2
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/refs/heads/master +0 -1
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/refs/tags/b1768 +0 -1
- llama_cpp_python-0.2.27/.git/modules/vendor/llama.cpp/shallow +0 -1
- llama_cpp_python-0.2.27/.git/objects/0e/f132b07175867c07ad06fa22ca6b95eca67b59 +0 -0
- llama_cpp_python-0.2.27/.git/objects/17/1f357f53b0de535157a2c9b4de04582784ec97 +0 -0
- llama_cpp_python-0.2.27/.git/objects/2e/24903c21db75253911a70039ac5622672db813 +0 -0
- llama_cpp_python-0.2.27/.git/objects/34/6b4631ebd1f4af85e9988d4a528e00edba6375 +0 -0
- llama_cpp_python-0.2.27/.git/objects/44/b6d4a35d3caf0c65aef0a1c77ff0ab4077d405 +0 -0
- llama_cpp_python-0.2.27/.git/objects/4a/ada532e4c07996d15f35fbb0e053ed7238327d +0 -0
- llama_cpp_python-0.2.27/.git/objects/55/d08db5f514fb6847938e3d6489b99f737ba6e3 +0 -0
- llama_cpp_python-0.2.27/.git/objects/70/674ee3783520771a1c9deeff88342b55121213 +0 -0
- llama_cpp_python-0.2.27/.git/objects/75/d0527fd782a792af8612e55b0a3f2dad469ae9 +0 -0
- llama_cpp_python-0.2.27/.git/objects/91/78a22255fef8acfe298d0f27640f65f647d400 +0 -0
- llama_cpp_python-0.2.27/.git/objects/ae/c023cd61b3bb83bac968fffdd6aa0810af7c3d +0 -0
- llama_cpp_python-0.2.27/.git/objects/af/f397f476fb7773d0e89b0e8913c8b1f97ca3e4 +0 -0
- llama_cpp_python-0.2.27/.git/objects/b2/b18e810f9b8b3bc88b6687bfd7e12210775dcf +0 -0
- llama_cpp_python-0.2.27/.git/objects/b9/373b7ac641e6e9c8d8cc64951139205d91d8bc +0 -0
- llama_cpp_python-0.2.27/.git/objects/bc/f16655452a718aa2d16f05af570ab880c9e963 +0 -0
- llama_cpp_python-0.2.27/.git/objects/c8/4fd04498c2fb188ff7c2a59473035fc90eb990 +0 -0
- llama_cpp_python-0.2.27/.git/objects/ca/e7ebb7a833dafcd402a96bea3a9574f74f0ed5 +0 -0
- llama_cpp_python-0.2.27/.git/objects/d3/fe66b3a71dcb391ace338d29ce8f86763e26d2 +0 -0
- llama_cpp_python-0.2.27/.git/objects/ec/a6b9a87f90d847475d3aa1b77f18c4871a4c68 +0 -0
- llama_cpp_python-0.2.27/.git/refs/tags/v0.2.27 +0 -1
- llama_cpp_python-0.2.27/.git/shallow +0 -1
- llama_cpp_python-0.2.27/tests/test_grammar.py +0 -13
- llama_cpp_python-0.2.27/vendor/llama.cpp/examples/llama.swiftui/README.md +0 -7
- llama_cpp_python-0.2.27/vendor/llama.cpp/examples/llama.swiftui/llama.cpp.swift/bridging-header.h +0 -5
- llama_cpp_python-0.2.27/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Assets.xcassets/AccentColor.colorset/Contents.json +0 -11
- llama_cpp_python-0.2.27/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Models/LlamaState.swift +0 -100
- llama_cpp_python-0.2.27/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Preview Content/Preview Assets.xcassets/Contents.json +0 -6
- llama_cpp_python-0.2.27/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/ContentView.swift +0 -138
- llama_cpp_python-0.2.27/vendor/llama.cpp/examples/metal/CMakeLists.txt +0 -4
- llama_cpp_python-0.2.27/vendor/llama.cpp/examples/metal/metal.cpp +0 -103
- llama_cpp_python-0.2.27/vendor/llama.cpp/ggml-metal.h +0 -115
- llama_cpp_python-0.2.27/vendor/llama.cpp/scripts/sync-ggml.last +0 -1
- llama_cpp_python-0.2.27/vendor/llama.cpp/spm-headers/ggml.h +0 -1
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.dockerignore +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/description +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/applypatch-msg.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/commit-msg.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/fsmonitor-watchman.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/post-update.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/pre-applypatch.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/pre-commit.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/pre-merge-commit.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/pre-push.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/pre-rebase.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/pre-receive.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/prepare-commit-msg.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/push-to-checkout.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/sendemail-validate.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/hooks/update.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/info/exclude +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/description +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/applypatch-msg.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/commit-msg.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/fsmonitor-watchman.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/post-update.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-applypatch.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-commit.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-merge-commit.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-push.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-rebase.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/pre-receive.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/prepare-commit-msg.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/push-to-checkout.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/sendemail-validate.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/hooks/update.sample +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/info/exclude +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/modules/vendor/llama.cpp/refs/remotes/origin/HEAD +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/04/5856ea2ffe697ec33db1c1c989bd45cde5bb3d +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/04/7bc14424303575f73af90611fec827334f54e8 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/0d/870969f4b23bd92a09ec29134d3fb454d38bec +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/0e/2a907c0e40de1a432ee0cd2e3d01c634df1a37 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/0e/f7bd4a856ec728adc565133e808628ea5566a1 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/11/2a0f7872fa9244bf38729a2722dc5c08dec20c +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/11/b6d5c26e3f7157658952b8ec353e985d522fac +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/13/c5b6b0df5f67e80cbe584909b83777901265a1 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/19/9bd4ffbf88c68c98b52c05f388dfa92716f6b7 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/23/e37d4d40e5ec0bfd85b5e928834d58e2cf0da6 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/24/04228325d88c59b819acaedb20b15635f75df9 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/27/2e4767b47397d1529e6a2d01298144d9d746ba +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/27/a6b1e5042318f85dc99c9f24f4dd6fc472d242 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/29/03e0146d304bcacbfabfe71f171a2edc03043e +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/2c/c6fb02dcb3226c1ecf0fbed6453eb3acadeaa2 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/39/697bfc2538bd4558018d0d721d6d6028c4bb56 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/3a/1d7180d508818fe957923e00dcd8950938632d +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/3a/6457dcdfd47e764654bacae0ba8347976b645a +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/41/cc68ea2402cf682807649d841e7c0f4175db01 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/47/4503fdfc554d8caabee4f321a80427f8c7d696 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/4b/3189dd1a54be3bc416786ddf184dd047dc4b20 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/51/f357200f8b998031f4be924e11ed2ae4bf3fea +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/56/2410fe1a4c4093d62e1705933eaf66c6d99a2c +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/5b/51e98ce432974ff031367f8937babe755e3d73 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/5f/350ffe99abe7297b2839f36fd0eaeb98887805 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/60/bc7aef42aac0409cfdca666ad2ff6f516d7b5b +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/61/027ef99725c50b0891fdbf0bf263a33abe648f +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/68/7316b327ca038d26a338b3070a7d4698322515 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/74/7c6130e3cb1479d20e2013b1dd3db3379c2266 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/76/e26fbd106895fba52861f8ac1e11cc6ee2a307 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/79/5dad726ae91f330c56e49bc188080b5b3b5ba9 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/79/a9e67a1aee09c6d182f240ba5eef32feabcbce +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/7a/7b899ec7dd48d192cba14ac9c8e9df4233f7fb +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/7d/5498f9d2c49c1f731b47845d845f6c5e16a3d9 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/7d/6c970483161eaf43cfa9d50010c071d4953053 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/7e/df0975dc12ccc95ad14de085f07efe6d65c620 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/7e/e8f748eab47180cea09c0ad8e75c3b991b4af4 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/80/7b0f57a8a873e58ade0ff0f5b0bcf0ff66b7f9 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/82/e5c4487e57d6d59c901a73bdd2a9bc172fee7c +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/8b/d03f88a1895cbf3ef249e13df79ee0efda779d +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/8e/32d2c0edce725a47b5845463133919cd766a61 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/91/abb11fdf507883caeeb2d2958e1c65fb6cbdc1 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/99/32d6130f5552a9b85c8b15b4ac6bc26b1068ce +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/9d/0ec2f705618e591cfa8d6512cb9a96b3da75f1 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/9d/3d3559849603efda6f3c8181684e4d19e0ec79 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/a9/e51cdc1672134ec9af66c9eccf09f6da4ceccd +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/ac/82b8fbb81087ec9b3a72d9e377102a31b28d16 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/b1/f90b91594f496ad9f27b1a68584984f4b523d2 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/b2/e879ec4bfb319459dd5357313ef06158c7039f +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/b5/affaa9d6087f3888dd9eedea209bb214b6e135 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/b9/1632f5bc787c1404600c894a6a4126359747d8 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/bb/cbbe7d61558adde3cbfd0c7a63a67c27ed6d30 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/c5/4e4eb5ce2636abd78df46a7616cfe9196a1198 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/c8/5e73d2b657bb05ed99309615d67bac93d9f86e +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/ca/ebbb67fdb02a0a8897d4e4826ea046a9931f6f +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/cc/6a3a7252ea6e698614f0629d4bc040ab6ca717 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/cd/351ba33849dcf6af35b493f7405962fa1625d4 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/d3/329eec3bac6ce7e54c76b77ac9bf99fab0fe3f +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/d3/efb3a6fe1e001db62ec08e5d31ce1d08567045 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/da/c33b74dddf06fcfc01244044eebb102cfcea37 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/e2/13518b95011cb6ee783986624c3b6de8659f81 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/e4/1f375774e6945e445bfb179502b128fe22dda7 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/e6/9de29bb2d1d6434b8b29ae775ad8c2e48c5391 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/e9/30609ff5c479a1d5e12a8f3993582d421a6326 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/eb/0fb9662e690d0f9de4632cddd321b3f872a725 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/eb/9a2cfa9167df02f136502af79738c71363abfd +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/ef/1b2c0162e8edd321e2b9c1ce375d96f1f1d048 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/f0/827d762e852a21f6406c469300899d5f509b8f +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/f1/b8e9d154231932c4b7b9b59611626764e68632 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/f2/0813765a70679e8a063871c9ef75d75c65ccb6 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/fa/dfc5fb4fe6f5eb6d5d98b62519e374a5202b00 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/fc/25ff5160028dee3570249abc40cd57780bcca9 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/fc/ef8cd800ee8a265b146748d178cb56b5632bf3 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/fd/64c09b37947c97e58903ce570785c657d56722 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/fe/b0ed68d94eac48b844fd587ddfb808649716a1 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.git/objects/ff/3e950cd1110fe552912cea4c268c4023d2b737 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.github/dependabot.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.github/workflows/build-and-release.yaml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.github/workflows/build-docker.yaml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.github/workflows/publish-to-test.yaml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.github/workflows/publish.yaml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.github/workflows/test-pypi.yaml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.github/workflows/test.yaml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.gitignore +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.gitmodules +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/.readthedocs.yaml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/LICENSE.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/Makefile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/cuda_simple/Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/open_llama/Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/open_llama/build.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/open_llama/hug_model.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/open_llama/start.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/open_llama/start_server.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/openblas_simple/Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/simple/Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docker/simple/run.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docs/api-reference.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docs/changelog.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docs/index.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docs/install/macos.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docs/requirements.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/docs/server.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/high_level_api/fastapi_server.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/high_level_api/high_level_api_embedding.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/high_level_api/high_level_api_inference.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/high_level_api/high_level_api_streaming.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/high_level_api/langchain_custom_llm.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/Chat.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/Miku.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/ReasonAct.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/low_level_api_llama_cpp.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/quantize.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/readme/low_level_api_llama_cpp.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/util.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/notebooks/Batching.ipynb +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/notebooks/Clients.ipynb +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/notebooks/Functions.ipynb +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/notebooks/Guidance.ipynb +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/notebooks/Multimodal.ipynb +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/notebooks/PerformanceTuning.ipynb +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/llama_chat_format.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/llama_types.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/llava_cpp.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/py.typed +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/server/__init__.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/server/__main__.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/server/app.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/server/cli.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/server/errors.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/llama_cpp/server/types.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/mkdocs.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/pyproject.toml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/tests/test_llama.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.clang-tidy +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/cloud-v-pipeline +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/full-cuda.Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/full-rocm.Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/full.Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/main-cuda.Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/main-rocm.Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/main.Dockerfile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/apps.nix +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/devshells.nix +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/jetson-support.nix +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/nixpkgs-instances.nix +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/nix/scope.nix +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.devops/tools.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.dockerignore +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.ecrc +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.editorconfig +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.flake8 +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.git +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/ISSUE_TEMPLATE/bug.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/ISSUE_TEMPLATE/enhancement.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/build.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/code-coverage.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/docker.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/editorconfig.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/gguf-publish.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/nix-publish-flake.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/python-check-requirements.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/python-lint.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/tidy-post.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/tidy-review.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.github/workflows/zig-build.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/.pre-commit-config.yaml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/LICENSE +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/SHA256SUMS +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/awq-py/awq/apply_awq.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/awq-py/requirements.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/build.zig +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ci/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ci/run.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/cmake/FindSIMD.cmake +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/codecov.yml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/base64.hpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/build-info.cpp.in +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/console.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/console.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/grammar-parser.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/grammar-parser.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/log.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/sampling.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/stb_image.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/train.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/common/train.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-llama-ggml-to-gguf.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-lora-to-ggml.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/convert-persimmon-to-gguf.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/BLIS.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/llama-star/idea-arch.key +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/llama-star/idea-arch.pdf +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/docs/token_generation_performance_tips.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/Miku.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/alpaca.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/baby-llama/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/baby-llama/baby-llama.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched-bench/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched-bench/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/.gitignore +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/Makefile +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/Package.swift +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/batched.swift/Sources/main.swift +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/beam-search/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/beam-search/beam-search.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/benchmark/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-13B.bat +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-13B.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-persistent.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat-vicuna.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/chat.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/convert-llama2c-to-ggml/convert-llama2c-to-ggml.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/embedding/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/embedding/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/embedding/embedding.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/export-lora/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/export-lora/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/convert-finetune-checkpoint-to-gguf.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/finetune.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/finetune/finetune.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/gguf/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/gguf/gguf.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/gpt4all.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/infill/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/infill/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/infill/infill.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/graph.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/jeopardy.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/qasheet.csv +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/jeopardy/questions.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/json-schema-to-grammar.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama-bench/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama-bench/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/.gitignore +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Assets.xcassets/AppIcon.appiconset/Contents.json +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/Assets.xcassets/Contents.json +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/UI/LoadCustomButton.swift +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui/llama_swiftuiApp.swift +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.xcworkspace/contents.xcworkspacedata +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.swiftui/llama.swiftui.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama.vim +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama2-13b.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llama2.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/clip.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/convert-image-encoder-to-gguf.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava-surgery.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llava/llava.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/llm.vim +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookahead/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookahead/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookahead/lookahead.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookup/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookup/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/lookup/lookup.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main-cmake-pkg/.gitignore +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main-cmake-pkg/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/main-cmake-pkg/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/make-ggml.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/parallel/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/parallel/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/parallel/parallel.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/perplexity/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/perplexity/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/perplexity/perplexity.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize-stats/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/quantize-stats/quantize-stats.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/reason-act.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/save-load-state/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/api_like_OAI.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/chat-llama2.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/chat.mjs +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/chat.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/completion.js.hpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/deps.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/httplib.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/index.html.hpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/index.js.hpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/json-schema-to-grammar.mjs.hpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/json.hpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/completion.js +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/index.html +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/index.js +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server/public/json-schema-to-grammar.mjs +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/server-llama2-13B.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/simple/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/simple/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/simple/simple.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/speculative/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/speculative/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/speculative/speculative.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/tokenize/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/tokenize/tokenize.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/convert-train-checkpoint-to-gguf.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/examples/train-text-from-scratch/train-text-from-scratch.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/flake.lock +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/flake.nix +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-mpi.c +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/ggml-mpi.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/LICENSE +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/examples/writer.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/__init__.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/gguf.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/gguf_reader.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/gguf_writer.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/py.typed +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/gguf/vocab.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/pyproject.toml +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/__init__.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/gguf-convert-endian.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/gguf-dump.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/scripts/gguf-set-metadata.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/gguf-py/tests/test_gguf.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/README.md +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/arithmetic.gbnf +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/c.gbnf +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/chess.gbnf +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/japanese.gbnf +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/json.gbnf +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/json_arr.gbnf +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/grammars/list.gbnf +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama-leader.jpeg +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama0-banner.png +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama0-logo.png +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama1-banner.png +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/media/llama1-logo.png +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/mypy.ini +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/vdot/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/vdot/q8dot.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/pocs/vdot/vdot.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/LLM-questions.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/alpaca.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/assistant.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-baichuan.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-bob.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-qwen.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-vicuna-v0.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat-with-vicuna-v1.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/chat.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/dan-modified.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/dan.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/mnemonics.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/parallel-questions.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/prompts/reason-act.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-hf-to-gguf.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-llama-ggml-to-gguf.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-lora-to-ggml.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert-persimmon-to-gguf.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements/requirements-convert.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/requirements.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/run_with_preset.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/LlamaConfig.cmake.in +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/build-info.cmake +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/build-info.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/check-requirements.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/convert-gg.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/gen-build-info-cpp.cmake +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/get-flags.mk +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/get-wikitext-2.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/qnt-all.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/run-all-perf.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/run-all-ppl.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/server-llm.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/sync-ggml.sh +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/scripts/verify-checksum-models.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/spm-headers/llama.h +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/CMakeLists.txt +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-c.c +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-double-float.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-grad0.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-grammar-parser.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-llama-grammar.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-opt.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-quantize-perf.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-rope.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-sampling.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-falcon.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-falcon.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-llama.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-0-llama.py +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-1-bpe.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/tests/test-tokenizer-1-llama.cpp +0 -0
- {llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/vendor/llama.cpp/unicode.h +0 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4b11fa83c00a3c04cfb47775ffcd226167d52044 '4b11fa83c00a3c04cfb47775ffcd226167d52044' of https://github.com/abetlen/llama-cpp-python
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4b11fa83c00a3c04cfb47775ffcd226167d52044
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
[gc]
|
|
10
10
|
auto = 0
|
|
11
11
|
[http "https://github.com/"]
|
|
12
|
-
extraheader = AUTHORIZATION: basic
|
|
12
|
+
extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzXzg0QXZkVFUxdjRsWmlJSlFjZHVISHVlZnBtUnA3STFDcUxkeA==
|
|
13
13
|
[submodule "vendor/llama.cpp"]
|
|
14
14
|
active = true
|
|
15
15
|
url = https://github.com/ggerganov/llama.cpp.git
|
|
Binary file
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 4b11fa83c00a3c04cfb47775ffcd226167d52044 runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341384 +0000 checkout: moving from master to refs/tags/v0.2.29
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -13,7 +13,7 @@
|
|
|
13
13
|
[gc]
|
|
14
14
|
auto = 0
|
|
15
15
|
[http "https://github.com/"]
|
|
16
|
-
extraheader = AUTHORIZATION: basic
|
|
16
|
+
extraheader = AUTHORIZATION: basic eC1hY2Nlc3MtdG9rZW46Z2hzXzg0QXZkVFUxdjRsWmlJSlFjZHVISHVlZnBtUnA3STFDcUxkeA==
|
|
17
17
|
[url "https://github.com/"]
|
|
18
18
|
insteadOf = git@github.com:
|
|
19
19
|
insteadOf = org-6826477@github.com:
|
|
Binary file
|
|
@@ -0,0 +1,2 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
|
|
2
|
+
4483396751c79dea540808b9cb9238245d06da2b 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 checkout: moving from master to 4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
0000000000000000000000000000000000000000 4483396751c79dea540808b9cb9238245d06da2b runner <runner@fv-az651-417.mi4nuvdbnkburlvweydx3iqepe.ex.internal.cloudapp.net> 1705341385 +0000 clone: from https://github.com/ggerganov/llama.cpp.git
|
|
Binary file
|
|
Binary file
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4483396751c79dea540808b9cb9238245d06da2b
|
|
@@ -0,0 +1,2 @@
|
|
|
1
|
+
x}TM��0�Y�bPj��%�[ ��K�S��R�lM-��J����w4�Xg7�A���潑�u5���w�띏ж�SU��b,<g��� �-�=l6�)��N#o��d&�k�#s)�s��"���1���U�)_������,��g���Ζ�O��ǁS,9�^�4R��]T��l���& D�#�*c5�J��[�ɐ �0�gq�q4�����Z�h�)�(EO��o�@0Ny�~���1MK9����8��W06.q��JK�z �%AZ���戝��y��wV���!R;�R�mU�g,Xz����#�2jN֥8������Dճ3�Q{�i��<�&��{�,��5 r�(���M�˽w=��A�H�P2��"�d)�A�s�����~�4�#=�<�eM����d��V`���'
|
|
2
|
+
.�����-����3��O9V<��R.�����n~1����L����_�H���y�W9/�{9ݕ�_��i����ҺЧ��P��A�Յ�����/]�X%
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4b11fa83c00a3c04cfb47775ffcd226167d52044
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
4b11fa83c00a3c04cfb47775ffcd226167d52044
|
|
@@ -7,6 +7,21 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
|
|
|
7
7
|
|
|
8
8
|
## [Unreleased]
|
|
9
9
|
|
|
10
|
+
## [0.2.29]
|
|
11
|
+
|
|
12
|
+
- feat: Update llama.cpp to ggerganov/llama.cpp@4483396751c79dea540808b9cb9238245d06da2b
|
|
13
|
+
- feat: Add split_mode option by @abetlen in 84615adbc6855c8384807c42f0130f9a1763f99d
|
|
14
|
+
- feat: Implement GGUF metadata KV overrides by @phiharri in #1011
|
|
15
|
+
- fix: Avoid "LookupError: unknown encoding: ascii" when open() called in a destructor by @yieldthought in #1012
|
|
16
|
+
- fix: Fix low_level_api_chat_cpp example to match current API by @aniljava in #1086
|
|
17
|
+
- fix: Fix Pydantic model parsing by @DeNeutoy in #1087
|
|
18
|
+
|
|
19
|
+
## [0.2.28]
|
|
20
|
+
|
|
21
|
+
- feat: Update llama.cpp to ggerganov/llama.cpp@6efb8eb30e7025b168f3fda3ff83b9b386428ad6
|
|
22
|
+
- feat: Add ability to pass in penalize_nl param by @shankinson in #1068
|
|
23
|
+
- fix: print_grammar to stderr by @turian in #1052
|
|
24
|
+
|
|
10
25
|
## [0.2.27]
|
|
11
26
|
|
|
12
27
|
- feat: Update llama.cpp to ggerganov/llama.cpp@b3a7c20b5c035250257d2b62851c379b159c899a
|
|
@@ -106,7 +106,7 @@ def gpt_params_parse(argv = None):
|
|
|
106
106
|
parser.add_argument("--mirostat_lr", type=float, default=0.1, help="Mirostat learning rate, parameter eta",dest="mirostat_eta")
|
|
107
107
|
|
|
108
108
|
parser.add_argument("-m", "--model", type=str, default="./models/llama-7B/ggml-model.bin", help="model path",dest="model")
|
|
109
|
-
parser.add_argument("-p", "--prompt", type=str, default=
|
|
109
|
+
parser.add_argument("-p", "--prompt", type=str, default=None, help="initial prompt",dest="prompt")
|
|
110
110
|
parser.add_argument("-f", "--file", type=str, default=None, help="file containing initial prompt to load",dest="file")
|
|
111
111
|
parser.add_argument("--session", type=str, default=None, help="file to cache model state in (may be large!)",dest="path_session")
|
|
112
112
|
parser.add_argument("--in-prefix", type=str, default="", help="string to prefix user inputs with", dest="input_prefix")
|
{llama_cpp_python-0.2.27 → llama_cpp_python-0.2.29}/examples/low_level_api/low_level_api_chat_cpp.py
RENAMED
|
@@ -62,7 +62,7 @@ specified) expect poor results""", file=sys.stderr)
|
|
|
62
62
|
self.multibyte_fix = []
|
|
63
63
|
|
|
64
64
|
# model load
|
|
65
|
-
self.lparams = llama_cpp.
|
|
65
|
+
self.lparams = llama_cpp.llama_model_default_params()
|
|
66
66
|
self.lparams.n_ctx = self.params.n_ctx
|
|
67
67
|
self.lparams.n_parts = self.params.n_parts
|
|
68
68
|
self.lparams.seed = self.params.seed
|
|
@@ -72,7 +72,11 @@ specified) expect poor results""", file=sys.stderr)
|
|
|
72
72
|
|
|
73
73
|
self.model = llama_cpp.llama_load_model_from_file(
|
|
74
74
|
self.params.model.encode("utf8"), self.lparams)
|
|
75
|
-
|
|
75
|
+
|
|
76
|
+
# Context Params.
|
|
77
|
+
self.cparams = llama_cpp.llama_context_default_params()
|
|
78
|
+
|
|
79
|
+
self.ctx = llama_cpp.llama_new_context_with_model(self.model, self.cparams)
|
|
76
80
|
if (not self.ctx):
|
|
77
81
|
raise RuntimeError(f"error: failed to load model '{self.params.model}'")
|
|
78
82
|
|
|
@@ -244,7 +248,7 @@ n_keep = {self.params.n_keep}
|
|
|
244
248
|
# tokenize a prompt
|
|
245
249
|
def _tokenize(self, prompt, bos=True):
|
|
246
250
|
_arr = (llama_cpp.llama_token * ((len(prompt) + 1) * 4))()
|
|
247
|
-
_n = llama_cpp.llama_tokenize(self.
|
|
251
|
+
_n = llama_cpp.llama_tokenize(self.model, prompt.encode("utf8", errors="ignore"), len(prompt), _arr, len(_arr), bos, False)
|
|
248
252
|
return _arr[:_n]
|
|
249
253
|
|
|
250
254
|
def set_color(self, c):
|
|
@@ -304,7 +308,7 @@ n_keep = {self.params.n_keep}
|
|
|
304
308
|
self.n_past += n_eval"""
|
|
305
309
|
|
|
306
310
|
if (llama_cpp.llama_eval(
|
|
307
|
-
self.ctx, (llama_cpp.llama_token * len(self.embd))(*self.embd), len(self.embd), self.n_past
|
|
311
|
+
self.ctx, (llama_cpp.llama_token * len(self.embd))(*self.embd), len(self.embd), self.n_past
|
|
308
312
|
) != 0):
|
|
309
313
|
raise Exception("Failed to llama_eval!")
|
|
310
314
|
|
|
@@ -332,7 +336,7 @@ n_keep = {self.params.n_keep}
|
|
|
332
336
|
id = 0
|
|
333
337
|
|
|
334
338
|
logits = llama_cpp.llama_get_logits(self.ctx)
|
|
335
|
-
n_vocab = llama_cpp.llama_n_vocab(self.
|
|
339
|
+
n_vocab = llama_cpp.llama_n_vocab(self.model)
|
|
336
340
|
|
|
337
341
|
# Apply params.logit_bias map
|
|
338
342
|
for key, value in self.params.logit_bias.items():
|
|
@@ -349,12 +353,20 @@ n_keep = {self.params.n_keep}
|
|
|
349
353
|
last_n_repeat = min(len(self.last_n_tokens), repeat_last_n, self.n_ctx)
|
|
350
354
|
|
|
351
355
|
_arr = (llama_cpp.llama_token * last_n_repeat)(*self.last_n_tokens[len(self.last_n_tokens) - last_n_repeat:])
|
|
352
|
-
llama_cpp.
|
|
353
|
-
|
|
354
|
-
|
|
355
|
-
|
|
356
|
-
|
|
357
|
-
|
|
356
|
+
llama_cpp.llama_sample_repetition_penalties(
|
|
357
|
+
ctx=self.ctx,
|
|
358
|
+
candidates=candidates_p,
|
|
359
|
+
last_tokens_data = _arr,
|
|
360
|
+
penalty_last_n = last_n_repeat,
|
|
361
|
+
penalty_repeat = llama_cpp.c_float(self.params.repeat_penalty),
|
|
362
|
+
penalty_freq = llama_cpp.c_float(self.params.frequency_penalty),
|
|
363
|
+
penalty_present = llama_cpp.c_float(self.params.presence_penalty),
|
|
364
|
+
)
|
|
365
|
+
|
|
366
|
+
# NOT PRESENT IN CURRENT VERSION ?
|
|
367
|
+
# llama_cpp.llama_sample_frequency_and_presence_penalti(self.ctx, candidates_p,
|
|
368
|
+
# _arr,
|
|
369
|
+
# last_n_repeat, llama_cpp.c_float(self.params.frequency_penalty), llama_cpp.c_float(self.params.presence_penalty))
|
|
358
370
|
|
|
359
371
|
if not self.params.penalize_nl:
|
|
360
372
|
logits[llama_cpp.llama_token_nl()] = nl_logit
|
|
@@ -473,7 +485,7 @@ n_keep = {self.params.n_keep}
|
|
|
473
485
|
def token_to_str(self, token_id: int) -> bytes:
|
|
474
486
|
size = 32
|
|
475
487
|
buffer = (ctypes.c_char * size)()
|
|
476
|
-
n = llama_cpp.
|
|
488
|
+
n = llama_cpp.llama_token_to_piece(
|
|
477
489
|
self.model, llama_cpp.llama_token(token_id), buffer, size)
|
|
478
490
|
assert n <= size
|
|
479
491
|
return bytes(buffer[:n])
|
|
@@ -532,6 +544,9 @@ n_keep = {self.params.n_keep}
|
|
|
532
544
|
print(i,end="",flush=True)
|
|
533
545
|
self.params.input_echo = False
|
|
534
546
|
|
|
547
|
+
# Using string instead of tokens to check for antiprompt,
|
|
548
|
+
# It is more reliable than tokens for interactive mode.
|
|
549
|
+
generated_str = ""
|
|
535
550
|
while self.params.interactive:
|
|
536
551
|
self.set_color(util.CONSOLE_COLOR_USER_INPUT)
|
|
537
552
|
if (self.params.instruct):
|
|
@@ -546,6 +561,10 @@ n_keep = {self.params.n_keep}
|
|
|
546
561
|
try:
|
|
547
562
|
for i in self.output():
|
|
548
563
|
print(i,end="",flush=True)
|
|
564
|
+
generated_str += i
|
|
565
|
+
for ap in self.params.antiprompt:
|
|
566
|
+
if generated_str.endswith(ap):
|
|
567
|
+
raise KeyboardInterrupt
|
|
549
568
|
except KeyboardInterrupt:
|
|
550
569
|
self.set_color(util.CONSOLE_COLOR_DEFAULT)
|
|
551
570
|
if not self.params.instruct:
|
|
@@ -561,7 +580,7 @@ if __name__ == "__main__":
|
|
|
561
580
|
time_now = datetime.now()
|
|
562
581
|
prompt = f"""Text transcript of a never ending dialog, where {USER_NAME} interacts with an AI assistant named {AI_NAME}.
|
|
563
582
|
{AI_NAME} is helpful, kind, honest, friendly, good at writing and never fails to answer {USER_NAME}’s requests immediately and with details and precision.
|
|
564
|
-
|
|
583
|
+
Transcript below contains only the recorded dialog between two, without any annotations like (30 seconds passed...) or (to himself), just what {USER_NAME} and {AI_NAME} say aloud to each other.
|
|
565
584
|
The dialog lasts for years, the entirety of it is shared below. It's 10000 pages long.
|
|
566
585
|
The transcript only includes text, it does not include markup like HTML and Markdown.
|
|
567
586
|
|
|
@@ -575,8 +594,11 @@ The transcript only includes text, it does not include markup like HTML and Mark
|
|
|
575
594
|
{AI_NAME}: A cat is a domestic species of small carnivorous mammal. It is the only domesticated species in the family Felidae.
|
|
576
595
|
{USER_NAME}: Name a color.
|
|
577
596
|
{AI_NAME}: Blue
|
|
578
|
-
{USER_NAME}:"""
|
|
597
|
+
{USER_NAME}: """
|
|
598
|
+
|
|
579
599
|
params = gpt_params_parse()
|
|
600
|
+
if params.prompt is None and params.file is None:
|
|
601
|
+
params.prompt = prompt
|
|
580
602
|
|
|
581
603
|
with LLaMAInteract(params) as m:
|
|
582
604
|
m.interact()
|
|
@@ -1,11 +1,15 @@
|
|
|
1
1
|
import os
|
|
2
2
|
import sys
|
|
3
3
|
|
|
4
|
+
import sys, traceback
|
|
5
|
+
|
|
6
|
+
# Avoid "LookupError: unknown encoding: ascii" when open() called in a destructor
|
|
7
|
+
outnull_file = open(os.devnull, "w")
|
|
8
|
+
errnull_file = open(os.devnull, "w")
|
|
4
9
|
|
|
5
10
|
class suppress_stdout_stderr(object):
|
|
6
11
|
# NOTE: these must be "saved" here to avoid exceptions when using
|
|
7
12
|
# this context manager inside of a __del__ method
|
|
8
|
-
open = open
|
|
9
13
|
sys = sys
|
|
10
14
|
os = os
|
|
11
15
|
|
|
@@ -21,9 +25,6 @@ class suppress_stdout_stderr(object):
|
|
|
21
25
|
if not hasattr(self.sys.stdout, 'fileno') or not hasattr(self.sys.stderr, 'fileno'):
|
|
22
26
|
return self # Return the instance without making changes
|
|
23
27
|
|
|
24
|
-
self.outnull_file = self.open(self.os.devnull, "w")
|
|
25
|
-
self.errnull_file = self.open(self.os.devnull, "w")
|
|
26
|
-
|
|
27
28
|
self.old_stdout_fileno_undup = self.sys.stdout.fileno()
|
|
28
29
|
self.old_stderr_fileno_undup = self.sys.stderr.fileno()
|
|
29
30
|
|
|
@@ -33,11 +34,11 @@ class suppress_stdout_stderr(object):
|
|
|
33
34
|
self.old_stdout = self.sys.stdout
|
|
34
35
|
self.old_stderr = self.sys.stderr
|
|
35
36
|
|
|
36
|
-
self.os.dup2(
|
|
37
|
-
self.os.dup2(
|
|
37
|
+
self.os.dup2(outnull_file.fileno(), self.old_stdout_fileno_undup)
|
|
38
|
+
self.os.dup2(errnull_file.fileno(), self.old_stderr_fileno_undup)
|
|
38
39
|
|
|
39
|
-
self.sys.stdout =
|
|
40
|
-
self.sys.stderr =
|
|
40
|
+
self.sys.stdout = outnull_file
|
|
41
|
+
self.sys.stderr = errnull_file
|
|
41
42
|
return self
|
|
42
43
|
|
|
43
44
|
def __exit__(self, *_):
|
|
@@ -54,6 +55,3 @@ class suppress_stdout_stderr(object):
|
|
|
54
55
|
|
|
55
56
|
self.os.close(self.old_stdout_fileno)
|
|
56
57
|
self.os.close(self.old_stderr_fileno)
|
|
57
|
-
|
|
58
|
-
self.outnull_file.close()
|
|
59
|
-
self.errnull_file.close()
|
|
@@ -730,11 +730,13 @@ class Llama:
|
|
|
730
730
|
*,
|
|
731
731
|
# Model Params
|
|
732
732
|
n_gpu_layers: int = 0,
|
|
733
|
+
split_mode: int = llama_cpp.LLAMA_SPLIT_LAYER,
|
|
733
734
|
main_gpu: int = 0,
|
|
734
735
|
tensor_split: Optional[List[float]] = None,
|
|
735
736
|
vocab_only: bool = False,
|
|
736
737
|
use_mmap: bool = True,
|
|
737
738
|
use_mlock: bool = False,
|
|
739
|
+
kv_overrides: Optional[Dict[str, Union[bool, int, float]]] = None,
|
|
738
740
|
# Context Params
|
|
739
741
|
seed: int = llama_cpp.LLAMA_DEFAULT_SEED,
|
|
740
742
|
n_ctx: int = 512,
|
|
@@ -798,11 +800,13 @@ class Llama:
|
|
|
798
800
|
Args:
|
|
799
801
|
model_path: Path to the model.
|
|
800
802
|
n_gpu_layers: Number of layers to offload to GPU (-ngl). If -1, all layers are offloaded.
|
|
801
|
-
|
|
803
|
+
split_mode: How to split the model across GPUs. See llama_cpp.LLAMA_SPLIT_* for options.
|
|
804
|
+
main_gpu: main_gpu interpretation depends on split_mode: LLAMA_SPLIT_NONE: the GPU that is used for the entire model. LLAMA_SPLIT_ROW: the GPU that is used for small tensors and intermediate results. LLAMA_SPLIT_LAYER: ignored
|
|
802
805
|
tensor_split: How split tensors should be distributed across GPUs. If None, the model is not split.
|
|
803
806
|
vocab_only: Only load the vocabulary no weights.
|
|
804
807
|
use_mmap: Use mmap if possible.
|
|
805
808
|
use_mlock: Force the system to keep the model in RAM.
|
|
809
|
+
kv_overrides: Key-value overrides for the model.
|
|
806
810
|
seed: RNG seed, -1 for random
|
|
807
811
|
n_ctx: Text context, 0 = from model
|
|
808
812
|
n_batch: Prompt processing maximum batch size
|
|
@@ -848,6 +852,7 @@ class Llama:
|
|
|
848
852
|
self.model_params.n_gpu_layers = (
|
|
849
853
|
0x7FFFFFFF if n_gpu_layers == -1 else n_gpu_layers
|
|
850
854
|
) # 0x7FFFFFFF is INT32 max, will be auto set to all layers
|
|
855
|
+
self.model_params.split_mode = split_mode
|
|
851
856
|
self.model_params.main_gpu = main_gpu
|
|
852
857
|
self.tensor_split = tensor_split
|
|
853
858
|
self._c_tensor_split = None
|
|
@@ -866,6 +871,34 @@ class Llama:
|
|
|
866
871
|
self.model_params.use_mmap = use_mmap if lora_path is None else False
|
|
867
872
|
self.model_params.use_mlock = use_mlock
|
|
868
873
|
|
|
874
|
+
self.kv_overrides = kv_overrides
|
|
875
|
+
if kv_overrides is not None:
|
|
876
|
+
n_overrides = len(kv_overrides)
|
|
877
|
+
self._kv_overrides_array = llama_cpp.llama_model_kv_override * (n_overrides + 1)
|
|
878
|
+
self._kv_overrides_array_keys = []
|
|
879
|
+
|
|
880
|
+
for k, v in kv_overrides.items():
|
|
881
|
+
key_buf = ctypes.create_string_buffer(k.encode("utf-8"))
|
|
882
|
+
self._kv_overrides_array_keys.append(key_buf)
|
|
883
|
+
self._kv_overrides_array[i].key = key_buf
|
|
884
|
+
if isinstance(v, int):
|
|
885
|
+
self._kv_overrides_array[i].tag = llama_cpp.LLAMA_KV_OVERRIDE_INT
|
|
886
|
+
self._kv_overrides_array[i].value.int_value = v
|
|
887
|
+
elif isinstance(v, float):
|
|
888
|
+
self._kv_overrides_array[i].tag = llama_cpp.LLAMA_KV_OVERRIDE_FLOAT
|
|
889
|
+
self._kv_overrides_array[i].value.float_value = v
|
|
890
|
+
elif isinstance(v, bool):
|
|
891
|
+
self._kv_overrides_array[i].tag = llama_cpp.LLAMA_KV_OVERRIDE_BOOL
|
|
892
|
+
self._kv_overrides_array[i].value.bool_value = v
|
|
893
|
+
else:
|
|
894
|
+
raise ValueError(f"Unknown value type for {k}: {v}")
|
|
895
|
+
|
|
896
|
+
self._kv_overrides_array_sentinel_key = b'\0'
|
|
897
|
+
|
|
898
|
+
# null array sentinel
|
|
899
|
+
self._kv_overrides_array[n_overrides].key = self._kv_overrides_array_sentinel_key
|
|
900
|
+
self.model_params.kv_overrides = self._kv_overrides_array
|
|
901
|
+
|
|
869
902
|
self.n_batch = min(n_ctx, n_batch) # ???
|
|
870
903
|
self.n_threads = n_threads or max(multiprocessing.cpu_count() // 2, 1)
|
|
871
904
|
self.n_threads_batch = n_threads_batch or max(
|
|
@@ -1201,6 +1234,7 @@ class Llama:
|
|
|
1201
1234
|
mirostat_mode: int = 0,
|
|
1202
1235
|
mirostat_tau: float = 5.0,
|
|
1203
1236
|
mirostat_eta: float = 0.1,
|
|
1237
|
+
penalize_nl: bool = True,
|
|
1204
1238
|
logits_processor: Optional[LogitsProcessorList] = None,
|
|
1205
1239
|
stopping_criteria: Optional[StoppingCriteriaList] = None,
|
|
1206
1240
|
grammar: Optional[LlamaGrammar] = None,
|
|
@@ -1261,6 +1295,7 @@ class Llama:
|
|
|
1261
1295
|
mirostat_eta=mirostat_eta,
|
|
1262
1296
|
logits_processor=logits_processor,
|
|
1263
1297
|
grammar=grammar,
|
|
1298
|
+
penalize_nl=penalize_nl,
|
|
1264
1299
|
)
|
|
1265
1300
|
if stopping_criteria is not None and stopping_criteria(
|
|
1266
1301
|
self._input_ids, self._scores[-1, :]
|
|
@@ -2141,11 +2176,13 @@ class Llama:
|
|
|
2141
2176
|
model_path=self.model_path,
|
|
2142
2177
|
# Model Params
|
|
2143
2178
|
n_gpu_layers=self.model_params.n_gpu_layers,
|
|
2179
|
+
split_mode=self.model_params.split_mode,
|
|
2144
2180
|
main_gpu=self.model_params.main_gpu,
|
|
2145
2181
|
tensor_split=self.tensor_split,
|
|
2146
2182
|
vocab_only=self.model_params.vocab_only,
|
|
2147
2183
|
use_mmap=self.model_params.use_mmap,
|
|
2148
2184
|
use_mlock=self.model_params.use_mlock,
|
|
2185
|
+
kv_overrides=self.kv_overrides,
|
|
2149
2186
|
# Context Params
|
|
2150
2187
|
seed=self.context_params.seed,
|
|
2151
2188
|
n_ctx=self.context_params.n_ctx,
|
|
@@ -2183,11 +2220,13 @@ class Llama:
|
|
|
2183
2220
|
model_path=state["model_path"],
|
|
2184
2221
|
# Model Params
|
|
2185
2222
|
n_gpu_layers=state["n_gpu_layers"],
|
|
2223
|
+
split_mode=state["split_mode"],
|
|
2186
2224
|
main_gpu=state["main_gpu"],
|
|
2187
2225
|
tensor_split=state["tensor_split"],
|
|
2188
2226
|
vocab_only=state["vocab_only"],
|
|
2189
2227
|
use_mmap=state["use_mmap"],
|
|
2190
2228
|
use_mlock=state["use_mlock"],
|
|
2229
|
+
kv_overrides=state["kv_overrides"],
|
|
2191
2230
|
# Context Params
|
|
2192
2231
|
seed=state["seed"],
|
|
2193
2232
|
n_ctx=state["n_ctx"],
|