@fugood/llama.node 0.6.3 → 1.0.0-beta.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CMakeLists.txt +40 -30
- package/README.md +4 -1
- package/lib/binding.js +41 -29
- package/lib/binding.ts +26 -25
- package/package.json +40 -7
- package/scripts/build.js +47 -0
- package/scripts/llama.cpp.patch +109 -0
- package/src/anyascii.c +22223 -0
- package/src/anyascii.h +42 -0
- package/src/tts_utils.cpp +20 -7
- package/src/tts_utils.h +2 -0
- package/bin/darwin/arm64/llama-node.node +0 -0
- package/bin/darwin/x64/llama-node.node +0 -0
- package/bin/linux/arm64/llama-node.node +0 -0
- package/bin/linux/x64/llama-node.node +0 -0
- package/bin/linux-cuda/arm64/llama-node.node +0 -0
- package/bin/linux-cuda/x64/llama-node.node +0 -0
- package/bin/linux-vulkan/arm64/llama-node.node +0 -0
- package/bin/linux-vulkan/x64/llama-node.node +0 -0
- package/bin/win32/x64/llama-node.node +0 -0
- package/bin/win32/x64/node.lib +0 -0
- package/bin/win32-vulkan/arm64/llama-node.node +0 -0
- package/bin/win32-vulkan/arm64/node.lib +0 -0
- package/bin/win32-vulkan/x64/llama-node.node +0 -0
- package/bin/win32-vulkan/x64/node.lib +0 -0
- package/src/llama.cpp/.github/workflows/build-linux-cross.yml +0 -233
- package/src/llama.cpp/.github/workflows/build.yml +0 -1078
- package/src/llama.cpp/.github/workflows/close-issue.yml +0 -28
- package/src/llama.cpp/.github/workflows/docker.yml +0 -178
- package/src/llama.cpp/.github/workflows/editorconfig.yml +0 -29
- package/src/llama.cpp/.github/workflows/gguf-publish.yml +0 -44
- package/src/llama.cpp/.github/workflows/labeler.yml +0 -17
- package/src/llama.cpp/.github/workflows/python-check-requirements.yml +0 -33
- package/src/llama.cpp/.github/workflows/python-lint.yml +0 -30
- package/src/llama.cpp/.github/workflows/python-type-check.yml +0 -40
- package/src/llama.cpp/.github/workflows/release.yml +0 -739
- package/src/llama.cpp/.github/workflows/server.yml +0 -237
- package/src/llama.cpp/.github/workflows/winget.yml +0 -42
- package/src/llama.cpp/cmake/arm64-apple-clang.cmake +0 -16
- package/src/llama.cpp/cmake/arm64-windows-llvm.cmake +0 -16
- package/src/llama.cpp/cmake/build-info.cmake +0 -64
- package/src/llama.cpp/cmake/common.cmake +0 -35
- package/src/llama.cpp/cmake/git-vars.cmake +0 -22
- package/src/llama.cpp/cmake/x64-windows-llvm.cmake +0 -5
- package/src/llama.cpp/common/build-info.cpp.in +0 -4
- package/src/llama.cpp/docs/build.md +0 -561
- package/src/llama.cpp/examples/CMakeLists.txt +0 -43
- package/src/llama.cpp/examples/batched/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/batched/batched.cpp +0 -246
- package/src/llama.cpp/examples/chat-13B.bat +0 -57
- package/src/llama.cpp/examples/convert-llama2c-to-ggml/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/convert-llama2c-to-ggml/convert-llama2c-to-ggml.cpp +0 -941
- package/src/llama.cpp/examples/deprecation-warning/deprecation-warning.cpp +0 -35
- package/src/llama.cpp/examples/embedding/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/embedding/embedding.cpp +0 -323
- package/src/llama.cpp/examples/eval-callback/CMakeLists.txt +0 -10
- package/src/llama.cpp/examples/eval-callback/eval-callback.cpp +0 -194
- package/src/llama.cpp/examples/gen-docs/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/gen-docs/gen-docs.cpp +0 -83
- package/src/llama.cpp/examples/gguf/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/gguf/gguf.cpp +0 -265
- package/src/llama.cpp/examples/gguf-hash/CMakeLists.txt +0 -22
- package/src/llama.cpp/examples/gguf-hash/deps/rotate-bits/rotate-bits.h +0 -46
- package/src/llama.cpp/examples/gguf-hash/deps/sha1/sha1.c +0 -295
- package/src/llama.cpp/examples/gguf-hash/deps/sha1/sha1.h +0 -52
- package/src/llama.cpp/examples/gguf-hash/deps/sha256/sha256.c +0 -221
- package/src/llama.cpp/examples/gguf-hash/deps/sha256/sha256.h +0 -24
- package/src/llama.cpp/examples/gguf-hash/deps/xxhash/xxhash.c +0 -42
- package/src/llama.cpp/examples/gguf-hash/deps/xxhash/xxhash.h +0 -7093
- package/src/llama.cpp/examples/gguf-hash/gguf-hash.cpp +0 -694
- package/src/llama.cpp/examples/gritlm/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/gritlm/gritlm.cpp +0 -229
- package/src/llama.cpp/examples/jeopardy/questions.txt +0 -100
- package/src/llama.cpp/examples/llama.android/app/build.gradle.kts +0 -65
- package/src/llama.cpp/examples/llama.android/build.gradle.kts +0 -6
- package/src/llama.cpp/examples/llama.android/llama/build.gradle.kts +0 -71
- package/src/llama.cpp/examples/llama.android/llama/src/main/cpp/CMakeLists.txt +0 -53
- package/src/llama.cpp/examples/llama.android/llama/src/main/cpp/llama-android.cpp +0 -452
- package/src/llama.cpp/examples/llama.android/settings.gradle.kts +0 -18
- package/src/llama.cpp/examples/lookahead/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/lookahead/lookahead.cpp +0 -472
- package/src/llama.cpp/examples/lookup/CMakeLists.txt +0 -23
- package/src/llama.cpp/examples/lookup/lookup-create.cpp +0 -40
- package/src/llama.cpp/examples/lookup/lookup-merge.cpp +0 -47
- package/src/llama.cpp/examples/lookup/lookup-stats.cpp +0 -157
- package/src/llama.cpp/examples/lookup/lookup.cpp +0 -242
- package/src/llama.cpp/examples/parallel/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/parallel/parallel.cpp +0 -492
- package/src/llama.cpp/examples/passkey/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/passkey/passkey.cpp +0 -277
- package/src/llama.cpp/examples/retrieval/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/retrieval/retrieval.cpp +0 -304
- package/src/llama.cpp/examples/save-load-state/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/save-load-state/save-load-state.cpp +0 -246
- package/src/llama.cpp/examples/simple/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/simple/simple.cpp +0 -206
- package/src/llama.cpp/examples/simple-chat/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/simple-chat/simple-chat.cpp +0 -206
- package/src/llama.cpp/examples/simple-cmake-pkg/CMakeLists.txt +0 -11
- package/src/llama.cpp/examples/speculative/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/speculative/speculative.cpp +0 -644
- package/src/llama.cpp/examples/speculative-simple/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/speculative-simple/speculative-simple.cpp +0 -261
- package/src/llama.cpp/examples/sycl/CMakeLists.txt +0 -9
- package/src/llama.cpp/examples/sycl/build.sh +0 -23
- package/src/llama.cpp/examples/sycl/ls-sycl-device.cpp +0 -13
- package/src/llama.cpp/examples/sycl/run-llama2.sh +0 -27
- package/src/llama.cpp/examples/sycl/run-llama3.sh +0 -28
- package/src/llama.cpp/examples/sycl/win-build-sycl.bat +0 -33
- package/src/llama.cpp/examples/sycl/win-run-llama2.bat +0 -9
- package/src/llama.cpp/examples/sycl/win-run-llama3.bat +0 -9
- package/src/llama.cpp/examples/training/CMakeLists.txt +0 -5
- package/src/llama.cpp/examples/training/finetune.cpp +0 -96
- package/src/llama.cpp/ggml/cmake/GitVars.cmake +0 -22
- package/src/llama.cpp/ggml/cmake/common.cmake +0 -26
- package/src/llama.cpp/ggml/src/ggml-alloc.c +0 -1042
- package/src/llama.cpp/ggml/src/ggml-backend-impl.h +0 -255
- package/src/llama.cpp/ggml/src/ggml-backend-reg.cpp +0 -586
- package/src/llama.cpp/ggml/src/ggml-backend.cpp +0 -2008
- package/src/llama.cpp/ggml/src/ggml-blas/CMakeLists.txt +0 -87
- package/src/llama.cpp/ggml/src/ggml-blas/ggml-blas.cpp +0 -517
- package/src/llama.cpp/ggml/src/ggml-cann/CMakeLists.txt +0 -74
- package/src/llama.cpp/ggml/src/ggml-cann/acl_tensor.cpp +0 -179
- package/src/llama.cpp/ggml/src/ggml-cann/acl_tensor.h +0 -258
- package/src/llama.cpp/ggml/src/ggml-cann/aclnn_ops.cpp +0 -2863
- package/src/llama.cpp/ggml/src/ggml-cann/aclnn_ops.h +0 -1110
- package/src/llama.cpp/ggml/src/ggml-cann/common.h +0 -420
- package/src/llama.cpp/ggml/src/ggml-cann/ggml-cann.cpp +0 -2570
- package/src/llama.cpp/ggml/src/ggml-common.h +0 -1857
- package/src/llama.cpp/ggml/src/ggml-cpu/cmake/FindSIMD.cmake +0 -100
- package/src/llama.cpp/ggml/src/ggml-cuda/CMakeLists.txt +0 -184
- package/src/llama.cpp/ggml/src/ggml-cuda/vendors/cuda.h +0 -15
- package/src/llama.cpp/ggml/src/ggml-cuda/vendors/hip.h +0 -243
- package/src/llama.cpp/ggml/src/ggml-cuda/vendors/musa.h +0 -140
- package/src/llama.cpp/ggml/src/ggml-hip/CMakeLists.txt +0 -131
- package/src/llama.cpp/ggml/src/ggml-impl.h +0 -601
- package/src/llama.cpp/ggml/src/ggml-kompute/CMakeLists.txt +0 -166
- package/src/llama.cpp/ggml/src/ggml-kompute/ggml-kompute.cpp +0 -2251
- package/src/llama.cpp/ggml/src/ggml-metal/CMakeLists.txt +0 -120
- package/src/llama.cpp/ggml/src/ggml-metal/ggml-metal-impl.h +0 -622
- package/src/llama.cpp/ggml/src/ggml-musa/CMakeLists.txt +0 -113
- package/src/llama.cpp/ggml/src/ggml-opencl/CMakeLists.txt +0 -96
- package/src/llama.cpp/ggml/src/ggml-opencl/ggml-opencl.cpp +0 -5124
- package/src/llama.cpp/ggml/src/ggml-opt.cpp +0 -1037
- package/src/llama.cpp/ggml/src/ggml-quants.c +0 -5232
- package/src/llama.cpp/ggml/src/ggml-quants.h +0 -100
- package/src/llama.cpp/ggml/src/ggml-rpc/CMakeLists.txt +0 -9
- package/src/llama.cpp/ggml/src/ggml-rpc/ggml-rpc.cpp +0 -1813
- package/src/llama.cpp/ggml/src/ggml-sycl/CMakeLists.txt +0 -189
- package/src/llama.cpp/ggml/src/ggml-sycl/backend.hpp +0 -37
- package/src/llama.cpp/ggml/src/ggml-sycl/binbcast.cpp +0 -239
- package/src/llama.cpp/ggml/src/ggml-sycl/binbcast.hpp +0 -39
- package/src/llama.cpp/ggml/src/ggml-sycl/common.cpp +0 -83
- package/src/llama.cpp/ggml/src/ggml-sycl/common.hpp +0 -493
- package/src/llama.cpp/ggml/src/ggml-sycl/concat.cpp +0 -197
- package/src/llama.cpp/ggml/src/ggml-sycl/concat.hpp +0 -20
- package/src/llama.cpp/ggml/src/ggml-sycl/conv.cpp +0 -100
- package/src/llama.cpp/ggml/src/ggml-sycl/conv.hpp +0 -20
- package/src/llama.cpp/ggml/src/ggml-sycl/convert.cpp +0 -623
- package/src/llama.cpp/ggml/src/ggml-sycl/convert.hpp +0 -34
- package/src/llama.cpp/ggml/src/ggml-sycl/cpy.cpp +0 -701
- package/src/llama.cpp/ggml/src/ggml-sycl/cpy.hpp +0 -11
- package/src/llama.cpp/ggml/src/ggml-sycl/dequantize.hpp +0 -791
- package/src/llama.cpp/ggml/src/ggml-sycl/dmmv.cpp +0 -1160
- package/src/llama.cpp/ggml/src/ggml-sycl/dmmv.hpp +0 -27
- package/src/llama.cpp/ggml/src/ggml-sycl/dpct/helper.hpp +0 -2957
- package/src/llama.cpp/ggml/src/ggml-sycl/element_wise.cpp +0 -1536
- package/src/llama.cpp/ggml/src/ggml-sycl/element_wise.hpp +0 -75
- package/src/llama.cpp/ggml/src/ggml-sycl/gemm.hpp +0 -99
- package/src/llama.cpp/ggml/src/ggml-sycl/getrows.cpp +0 -311
- package/src/llama.cpp/ggml/src/ggml-sycl/getrows.hpp +0 -20
- package/src/llama.cpp/ggml/src/ggml-sycl/ggml-sycl.cpp +0 -4443
- package/src/llama.cpp/ggml/src/ggml-sycl/gla.cpp +0 -105
- package/src/llama.cpp/ggml/src/ggml-sycl/gla.hpp +0 -8
- package/src/llama.cpp/ggml/src/ggml-sycl/im2col.cpp +0 -136
- package/src/llama.cpp/ggml/src/ggml-sycl/im2col.hpp +0 -21
- package/src/llama.cpp/ggml/src/ggml-sycl/mmq.cpp +0 -3030
- package/src/llama.cpp/ggml/src/ggml-sycl/mmq.hpp +0 -33
- package/src/llama.cpp/ggml/src/ggml-sycl/mmvq.cpp +0 -1108
- package/src/llama.cpp/ggml/src/ggml-sycl/mmvq.hpp +0 -27
- package/src/llama.cpp/ggml/src/ggml-sycl/norm.cpp +0 -474
- package/src/llama.cpp/ggml/src/ggml-sycl/norm.hpp +0 -26
- package/src/llama.cpp/ggml/src/ggml-sycl/outprod.cpp +0 -46
- package/src/llama.cpp/ggml/src/ggml-sycl/outprod.hpp +0 -10
- package/src/llama.cpp/ggml/src/ggml-sycl/presets.hpp +0 -74
- package/src/llama.cpp/ggml/src/ggml-sycl/quants.hpp +0 -83
- package/src/llama.cpp/ggml/src/ggml-sycl/rope.cpp +0 -362
- package/src/llama.cpp/ggml/src/ggml-sycl/rope.hpp +0 -20
- package/src/llama.cpp/ggml/src/ggml-sycl/softmax.cpp +0 -264
- package/src/llama.cpp/ggml/src/ggml-sycl/softmax.hpp +0 -20
- package/src/llama.cpp/ggml/src/ggml-sycl/sycl_hw.cpp +0 -13
- package/src/llama.cpp/ggml/src/ggml-sycl/sycl_hw.hpp +0 -23
- package/src/llama.cpp/ggml/src/ggml-sycl/tsembd.cpp +0 -73
- package/src/llama.cpp/ggml/src/ggml-sycl/tsembd.hpp +0 -20
- package/src/llama.cpp/ggml/src/ggml-sycl/vecdotq.hpp +0 -1215
- package/src/llama.cpp/ggml/src/ggml-sycl/wkv.cpp +0 -305
- package/src/llama.cpp/ggml/src/ggml-sycl/wkv.hpp +0 -10
- package/src/llama.cpp/ggml/src/ggml-threading.cpp +0 -12
- package/src/llama.cpp/ggml/src/ggml-threading.h +0 -14
- package/src/llama.cpp/ggml/src/ggml-vulkan/CMakeLists.txt +0 -196
- package/src/llama.cpp/ggml/src/ggml-vulkan/ggml-vulkan.cpp +0 -10699
- package/src/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/CMakeLists.txt +0 -39
- package/src/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp +0 -751
- package/src/llama.cpp/ggml/src/ggml.c +0 -6550
- package/src/llama.cpp/ggml/src/gguf.cpp +0 -1330
- package/src/llama.cpp/models/.editorconfig +0 -1
- package/src/llama.cpp/models/ggml-vocab-aquila.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-baichuan.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-bert-bge.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-bert-bge.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-bert-bge.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-chameleon.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-chameleon.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-command-r.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-command-r.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-command-r.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-deepseek-coder.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-deepseek-coder.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-deepseek-coder.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-deepseek-llm.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-deepseek-llm.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-deepseek-llm.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-deepseek-r1-qwen.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-deepseek-r1-qwen.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-falcon.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-falcon.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-falcon.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-gpt-2.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-gpt-2.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-gpt-2.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-gpt-4o.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-gpt-4o.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-gpt-neox.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-llama-bpe.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-llama-bpe.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-llama-bpe.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-llama-spm.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-llama-spm.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-llama-spm.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-llama4.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-llama4.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-mpt.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-mpt.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-mpt.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-phi-3.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-phi-3.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-phi-3.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-pixtral.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-pixtral.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-qwen2.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-qwen2.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-qwen2.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-refact.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-refact.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-refact.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-roberta-bpe.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-roberta-bpe.gguf.out +0 -46
- package/src/llama.cpp/models/ggml-vocab-starcoder.gguf +0 -0
- package/src/llama.cpp/models/ggml-vocab-starcoder.gguf.inp +0 -112
- package/src/llama.cpp/models/ggml-vocab-starcoder.gguf.out +0 -46
- package/src/llama.cpp/pocs/CMakeLists.txt +0 -14
- package/src/llama.cpp/pocs/vdot/CMakeLists.txt +0 -9
- package/src/llama.cpp/pocs/vdot/q8dot.cpp +0 -173
- package/src/llama.cpp/pocs/vdot/vdot.cpp +0 -311
- package/src/llama.cpp/prompts/LLM-questions.txt +0 -49
- package/src/llama.cpp/prompts/alpaca.txt +0 -1
- package/src/llama.cpp/prompts/assistant.txt +0 -31
- package/src/llama.cpp/prompts/chat-with-baichuan.txt +0 -4
- package/src/llama.cpp/prompts/chat-with-bob.txt +0 -7
- package/src/llama.cpp/prompts/chat-with-qwen.txt +0 -1
- package/src/llama.cpp/prompts/chat-with-vicuna-v0.txt +0 -7
- package/src/llama.cpp/prompts/chat-with-vicuna-v1.txt +0 -7
- package/src/llama.cpp/prompts/chat.txt +0 -28
- package/src/llama.cpp/prompts/dan-modified.txt +0 -1
- package/src/llama.cpp/prompts/dan.txt +0 -1
- package/src/llama.cpp/prompts/mnemonics.txt +0 -93
- package/src/llama.cpp/prompts/parallel-questions.txt +0 -43
- package/src/llama.cpp/prompts/reason-act.txt +0 -18
- package/src/llama.cpp/requirements/requirements-all.txt +0 -15
- package/src/llama.cpp/requirements/requirements-compare-llama-bench.txt +0 -2
- package/src/llama.cpp/requirements/requirements-convert_hf_to_gguf.txt +0 -7
- package/src/llama.cpp/requirements/requirements-convert_hf_to_gguf_update.txt +0 -7
- package/src/llama.cpp/requirements/requirements-convert_legacy_llama.txt +0 -5
- package/src/llama.cpp/requirements/requirements-convert_llama_ggml_to_gguf.txt +0 -1
- package/src/llama.cpp/requirements/requirements-convert_lora_to_gguf.txt +0 -4
- package/src/llama.cpp/requirements/requirements-gguf_editor_gui.txt +0 -3
- package/src/llama.cpp/requirements/requirements-pydantic.txt +0 -3
- package/src/llama.cpp/requirements/requirements-test-tokenizer-random.txt +0 -1
- package/src/llama.cpp/requirements/requirements-tool_bench.txt +0 -12
- package/src/llama.cpp/requirements.txt +0 -13
- package/src/llama.cpp/scripts/build-info.sh +0 -30
- package/src/llama.cpp/scripts/install-oneapi.bat +0 -19
- package/src/llama.cpp/scripts/xxd.cmake +0 -16
- package/src/llama.cpp/tests/CMakeLists.txt +0 -177
- package/src/llama.cpp/tests/get-model.cpp +0 -21
- package/src/llama.cpp/tests/get-model.h +0 -2
- package/src/llama.cpp/tests/test-arg-parser.cpp +0 -178
- package/src/llama.cpp/tests/test-autorelease.cpp +0 -24
- package/src/llama.cpp/tests/test-backend-ops.cpp +0 -4793
- package/src/llama.cpp/tests/test-barrier.cpp +0 -94
- package/src/llama.cpp/tests/test-c.c +0 -7
- package/src/llama.cpp/tests/test-chat-template.cpp +0 -417
- package/src/llama.cpp/tests/test-chat.cpp +0 -985
- package/src/llama.cpp/tests/test-double-float.cpp +0 -57
- package/src/llama.cpp/tests/test-gbnf-validator.cpp +0 -109
- package/src/llama.cpp/tests/test-gguf.cpp +0 -1338
- package/src/llama.cpp/tests/test-grammar-integration.cpp +0 -1308
- package/src/llama.cpp/tests/test-grammar-llguidance.cpp +0 -1201
- package/src/llama.cpp/tests/test-grammar-parser.cpp +0 -519
- package/src/llama.cpp/tests/test-json-schema-to-grammar.cpp +0 -1304
- package/src/llama.cpp/tests/test-llama-grammar.cpp +0 -408
- package/src/llama.cpp/tests/test-log.cpp +0 -39
- package/src/llama.cpp/tests/test-model-load-cancel.cpp +0 -27
- package/src/llama.cpp/tests/test-mtmd-c-api.c +0 -63
- package/src/llama.cpp/tests/test-opt.cpp +0 -904
- package/src/llama.cpp/tests/test-quantize-fns.cpp +0 -186
- package/src/llama.cpp/tests/test-quantize-perf.cpp +0 -365
- package/src/llama.cpp/tests/test-quantize-stats.cpp +0 -424
- package/src/llama.cpp/tests/test-regex-partial.cpp +0 -288
- package/src/llama.cpp/tests/test-rope.cpp +0 -262
- package/src/llama.cpp/tests/test-sampling.cpp +0 -399
- package/src/llama.cpp/tests/test-tokenizer-0.cpp +0 -312
- package/src/llama.cpp/tests/test-tokenizer-1-bpe.cpp +0 -155
- package/src/llama.cpp/tests/test-tokenizer-1-spm.cpp +0 -125
- package/src/llama.cpp/tools/CMakeLists.txt +0 -39
- package/src/llama.cpp/tools/batched-bench/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/batched-bench/batched-bench.cpp +0 -204
- package/src/llama.cpp/tools/cvector-generator/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/cvector-generator/completions.txt +0 -582
- package/src/llama.cpp/tools/cvector-generator/cvector-generator.cpp +0 -508
- package/src/llama.cpp/tools/cvector-generator/mean.hpp +0 -48
- package/src/llama.cpp/tools/cvector-generator/negative.txt +0 -4
- package/src/llama.cpp/tools/cvector-generator/pca.hpp +0 -315
- package/src/llama.cpp/tools/cvector-generator/positive.txt +0 -4
- package/src/llama.cpp/tools/export-lora/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/export-lora/export-lora.cpp +0 -434
- package/src/llama.cpp/tools/gguf-split/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/gguf-split/gguf-split.cpp +0 -583
- package/src/llama.cpp/tools/imatrix/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/imatrix/imatrix.cpp +0 -667
- package/src/llama.cpp/tools/llama-bench/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/llama-bench/llama-bench.cpp +0 -2024
- package/src/llama.cpp/tools/main/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/main/main.cpp +0 -977
- package/src/llama.cpp/tools/mtmd/CMakeLists.txt +0 -58
- package/src/llama.cpp/tools/mtmd/clip-impl.h +0 -462
- package/src/llama.cpp/tools/mtmd/clip.cpp +0 -4024
- package/src/llama.cpp/tools/mtmd/clip.h +0 -101
- package/src/llama.cpp/tools/mtmd/deprecation-warning.cpp +0 -22
- package/src/llama.cpp/tools/mtmd/miniaudio.h +0 -93468
- package/src/llama.cpp/tools/mtmd/mtmd-audio.cpp +0 -855
- package/src/llama.cpp/tools/mtmd/mtmd-audio.h +0 -62
- package/src/llama.cpp/tools/mtmd/mtmd-cli.cpp +0 -377
- package/src/llama.cpp/tools/mtmd/mtmd-helper.cpp +0 -297
- package/src/llama.cpp/tools/mtmd/mtmd.cpp +0 -942
- package/src/llama.cpp/tools/mtmd/mtmd.h +0 -362
- package/src/llama.cpp/tools/mtmd/requirements.txt +0 -5
- package/src/llama.cpp/tools/perplexity/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/perplexity/perplexity.cpp +0 -2063
- package/src/llama.cpp/tools/quantize/CMakeLists.txt +0 -6
- package/src/llama.cpp/tools/quantize/quantize.cpp +0 -519
- package/src/llama.cpp/tools/rpc/CMakeLists.txt +0 -4
- package/src/llama.cpp/tools/rpc/rpc-server.cpp +0 -322
- package/src/llama.cpp/tools/run/CMakeLists.txt +0 -16
- package/src/llama.cpp/tools/run/linenoise.cpp/linenoise.cpp +0 -1995
- package/src/llama.cpp/tools/run/linenoise.cpp/linenoise.h +0 -137
- package/src/llama.cpp/tools/run/run.cpp +0 -1261
- package/src/llama.cpp/tools/server/CMakeLists.txt +0 -51
- package/src/llama.cpp/tools/server/bench/requirements.txt +0 -2
- package/src/llama.cpp/tools/server/httplib.h +0 -10506
- package/src/llama.cpp/tools/server/server.cpp +0 -4966
- package/src/llama.cpp/tools/server/tests/requirements.txt +0 -8
- package/src/llama.cpp/tools/server/utils.hpp +0 -1337
- package/src/llama.cpp/tools/tokenize/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/tokenize/tokenize.cpp +0 -416
- package/src/llama.cpp/tools/tts/CMakeLists.txt +0 -5
- package/src/llama.cpp/tools/tts/tts.cpp +0 -1092
|
@@ -1,112 +0,0 @@
|
|
|
1
|
-
ied 4 ½ months
|
|
2
|
-
__ggml_vocab_test__
|
|
3
|
-
Führer
|
|
4
|
-
__ggml_vocab_test__
|
|
5
|
-
|
|
6
|
-
__ggml_vocab_test__
|
|
7
|
-
|
|
8
|
-
__ggml_vocab_test__
|
|
9
|
-
|
|
10
|
-
__ggml_vocab_test__
|
|
11
|
-
|
|
12
|
-
__ggml_vocab_test__
|
|
13
|
-
|
|
14
|
-
__ggml_vocab_test__
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
__ggml_vocab_test__
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
__ggml_vocab_test__
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
__ggml_vocab_test__
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
__ggml_vocab_test__
|
|
30
|
-
Hello world
|
|
31
|
-
__ggml_vocab_test__
|
|
32
|
-
Hello world
|
|
33
|
-
__ggml_vocab_test__
|
|
34
|
-
Hello World
|
|
35
|
-
__ggml_vocab_test__
|
|
36
|
-
Hello World
|
|
37
|
-
__ggml_vocab_test__
|
|
38
|
-
Hello World!
|
|
39
|
-
__ggml_vocab_test__
|
|
40
|
-
Hello, world!
|
|
41
|
-
__ggml_vocab_test__
|
|
42
|
-
Hello, world!
|
|
43
|
-
__ggml_vocab_test__
|
|
44
|
-
this is 🦙.cpp
|
|
45
|
-
__ggml_vocab_test__
|
|
46
|
-
w048 7tuijk dsdfhu
|
|
47
|
-
__ggml_vocab_test__
|
|
48
|
-
нещо на Български
|
|
49
|
-
__ggml_vocab_test__
|
|
50
|
-
កាន់តែពិសេសអាចខលចេញ
|
|
51
|
-
__ggml_vocab_test__
|
|
52
|
-
🚀 (normal) 😶🌫️ (multiple emojis concatenated) ✅ (only emoji that has its own token)
|
|
53
|
-
__ggml_vocab_test__
|
|
54
|
-
Hello
|
|
55
|
-
__ggml_vocab_test__
|
|
56
|
-
Hello
|
|
57
|
-
__ggml_vocab_test__
|
|
58
|
-
Hello
|
|
59
|
-
__ggml_vocab_test__
|
|
60
|
-
Hello
|
|
61
|
-
__ggml_vocab_test__
|
|
62
|
-
Hello
|
|
63
|
-
__ggml_vocab_test__
|
|
64
|
-
Hello
|
|
65
|
-
Hello
|
|
66
|
-
__ggml_vocab_test__
|
|
67
|
-
(
|
|
68
|
-
__ggml_vocab_test__
|
|
69
|
-
|
|
70
|
-
=
|
|
71
|
-
__ggml_vocab_test__
|
|
72
|
-
' era
|
|
73
|
-
__ggml_vocab_test__
|
|
74
|
-
Hello, y'all! How are you 😁 ?我想在apple工作1314151天~
|
|
75
|
-
__ggml_vocab_test__
|
|
76
|
-
!!!!!!
|
|
77
|
-
__ggml_vocab_test__
|
|
78
|
-
3
|
|
79
|
-
__ggml_vocab_test__
|
|
80
|
-
33
|
|
81
|
-
__ggml_vocab_test__
|
|
82
|
-
333
|
|
83
|
-
__ggml_vocab_test__
|
|
84
|
-
3333
|
|
85
|
-
__ggml_vocab_test__
|
|
86
|
-
33333
|
|
87
|
-
__ggml_vocab_test__
|
|
88
|
-
333333
|
|
89
|
-
__ggml_vocab_test__
|
|
90
|
-
3333333
|
|
91
|
-
__ggml_vocab_test__
|
|
92
|
-
33333333
|
|
93
|
-
__ggml_vocab_test__
|
|
94
|
-
333333333
|
|
95
|
-
__ggml_vocab_test__
|
|
96
|
-
Cửa Việt
|
|
97
|
-
__ggml_vocab_test__
|
|
98
|
-
discards
|
|
99
|
-
__ggml_vocab_test__
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
🚀 (normal) 😶🌫️ (multiple emojis concatenated) ✅ 🦙🦙 3 33 333 3333 33333 333333 3333333 33333333 3.3 3..3 3...3 កាន់តែពិសេសអាច😁 ?我想在apple工作1314151天~ ------======= нещо на Български ''''''```````""""......!!!!!!?????? I've been 'told he's there, 'RE you sure? 'M not sure I'll make it, 'D you like some tea? We'Ve a'lL
|
|
112
|
-
__ggml_vocab_test__
|
|
@@ -1,46 +0,0 @@
|
|
|
1
|
-
4833 225 38 225 143 140 17723
|
|
2
|
-
56 2006 3935 265
|
|
3
|
-
|
|
4
|
-
225
|
|
5
|
-
261
|
|
6
|
-
264
|
|
7
|
-
202
|
|
8
|
-
203
|
|
9
|
-
478
|
|
10
|
-
2831
|
|
11
|
-
15773
|
|
12
|
-
8279 5788
|
|
13
|
-
12000 5788
|
|
14
|
-
8279 10896
|
|
15
|
-
12000 10896
|
|
16
|
-
12000 10896 19
|
|
17
|
-
8279 30 5788 19
|
|
18
|
-
12000 30 5788 19
|
|
19
|
-
458 438 5945 118 252 32 3766
|
|
20
|
-
105 34 38 42 225 41 102 1707 12530 10180 1479 8278
|
|
21
|
-
39862 8372 1039 9446 40242 13852 2053 8949 12531 1520 10700
|
|
22
|
-
14574 227 14574 133 14574 246 30457 238 14574 242 30457 229 14574 249 14574 134 14574 258 30457 228 14574 258 14574 114 14574 133 14574 232 14574 228 14574 254 14574 232 30457 228 14574 236
|
|
23
|
-
3807 253 227 308 4382 27 18458 133 46113 44967 123 13868 308 12565 19775 33071 40824 733 27 41889 308 2585 22680 688 1401 2819 4369 2404 27
|
|
24
|
-
8279
|
|
25
|
-
12000
|
|
26
|
-
225 12000
|
|
27
|
-
261 12000
|
|
28
|
-
264 12000
|
|
29
|
-
264 12000 284 12000
|
|
30
|
-
308
|
|
31
|
-
203 280
|
|
32
|
-
25 34666
|
|
33
|
-
8279 30 533 25 464 19 4971 884 844 18458 228 1018 4982 13368 2909 9513 17827 35 37 35 38 35 39 35 11873 47838
|
|
34
|
-
9163 3202
|
|
35
|
-
37
|
|
36
|
-
37 37
|
|
37
|
-
37 37 37
|
|
38
|
-
37 37 37 37
|
|
39
|
-
37 37 37 37 37
|
|
40
|
-
37 37 37 37 37 37
|
|
41
|
-
37 37 37 37 37 37 37
|
|
42
|
-
37 37 37 37 37 37 37 37
|
|
43
|
-
37 37 37 37 37 37 37 37 37
|
|
44
|
-
53 33934 83 33217 17102 102
|
|
45
|
-
1214 12258
|
|
46
|
-
334 719 8878 202 10885 4222 16104 28570 203 3807 253 227 308 4382 27 18458 133 46113 44967 123 13868 308 12565 19775 33071 40824 733 27 41889 5945 118 252 3807 118 252 225 37 225 37 37 225 37 37 37 225 37 37 37 37 225 37 37 37 37 37 225 37 37 37 37 37 37 225 37 37 37 37 37 37 37 225 37 37 37 37 37 37 37 37 225 37 32 37 225 37 497 37 225 37 1179 37 225 14574 227 14574 133 14574 246 30457 238 14574 242 30457 229 14574 249 14574 134 14574 258 30457 228 14574 258 14574 114 14574 133 14574 232 36628 228 1018 4982 13368 2909 9513 17827 35 37 35 38 35 39 35 11873 47838 20921 16623 13028 8372 1039 9446 40242 13852 2053 8949 12531 1520 10700 5881 9592 13299 914 31753 31359 9163 3202 35472 10397 439 4763 2583 330 102 1455 938 1182 2017 30 330 613 844 3654 49 330 63 646 3654 439 4621 1930 561 30 330 54 844 2124 1629 35993 49 2688 25 7709 312 25 94 62
|
|
@@ -1,112 +0,0 @@
|
|
|
1
|
-
ied 4 ½ months
|
|
2
|
-
__ggml_vocab_test__
|
|
3
|
-
Führer
|
|
4
|
-
__ggml_vocab_test__
|
|
5
|
-
|
|
6
|
-
__ggml_vocab_test__
|
|
7
|
-
|
|
8
|
-
__ggml_vocab_test__
|
|
9
|
-
|
|
10
|
-
__ggml_vocab_test__
|
|
11
|
-
|
|
12
|
-
__ggml_vocab_test__
|
|
13
|
-
|
|
14
|
-
__ggml_vocab_test__
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
__ggml_vocab_test__
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
__ggml_vocab_test__
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
__ggml_vocab_test__
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
__ggml_vocab_test__
|
|
30
|
-
Hello world
|
|
31
|
-
__ggml_vocab_test__
|
|
32
|
-
Hello world
|
|
33
|
-
__ggml_vocab_test__
|
|
34
|
-
Hello World
|
|
35
|
-
__ggml_vocab_test__
|
|
36
|
-
Hello World
|
|
37
|
-
__ggml_vocab_test__
|
|
38
|
-
Hello World!
|
|
39
|
-
__ggml_vocab_test__
|
|
40
|
-
Hello, world!
|
|
41
|
-
__ggml_vocab_test__
|
|
42
|
-
Hello, world!
|
|
43
|
-
__ggml_vocab_test__
|
|
44
|
-
this is 🦙.cpp
|
|
45
|
-
__ggml_vocab_test__
|
|
46
|
-
w048 7tuijk dsdfhu
|
|
47
|
-
__ggml_vocab_test__
|
|
48
|
-
нещо на Български
|
|
49
|
-
__ggml_vocab_test__
|
|
50
|
-
កាន់តែពិសេសអាចខលចេញ
|
|
51
|
-
__ggml_vocab_test__
|
|
52
|
-
🚀 (normal) 😶🌫️ (multiple emojis concatenated) ✅ (only emoji that has its own token)
|
|
53
|
-
__ggml_vocab_test__
|
|
54
|
-
Hello
|
|
55
|
-
__ggml_vocab_test__
|
|
56
|
-
Hello
|
|
57
|
-
__ggml_vocab_test__
|
|
58
|
-
Hello
|
|
59
|
-
__ggml_vocab_test__
|
|
60
|
-
Hello
|
|
61
|
-
__ggml_vocab_test__
|
|
62
|
-
Hello
|
|
63
|
-
__ggml_vocab_test__
|
|
64
|
-
Hello
|
|
65
|
-
Hello
|
|
66
|
-
__ggml_vocab_test__
|
|
67
|
-
(
|
|
68
|
-
__ggml_vocab_test__
|
|
69
|
-
|
|
70
|
-
=
|
|
71
|
-
__ggml_vocab_test__
|
|
72
|
-
' era
|
|
73
|
-
__ggml_vocab_test__
|
|
74
|
-
Hello, y'all! How are you 😁 ?我想在apple工作1314151天~
|
|
75
|
-
__ggml_vocab_test__
|
|
76
|
-
!!!!!!
|
|
77
|
-
__ggml_vocab_test__
|
|
78
|
-
3
|
|
79
|
-
__ggml_vocab_test__
|
|
80
|
-
33
|
|
81
|
-
__ggml_vocab_test__
|
|
82
|
-
333
|
|
83
|
-
__ggml_vocab_test__
|
|
84
|
-
3333
|
|
85
|
-
__ggml_vocab_test__
|
|
86
|
-
33333
|
|
87
|
-
__ggml_vocab_test__
|
|
88
|
-
333333
|
|
89
|
-
__ggml_vocab_test__
|
|
90
|
-
3333333
|
|
91
|
-
__ggml_vocab_test__
|
|
92
|
-
33333333
|
|
93
|
-
__ggml_vocab_test__
|
|
94
|
-
333333333
|
|
95
|
-
__ggml_vocab_test__
|
|
96
|
-
Cửa Việt
|
|
97
|
-
__ggml_vocab_test__
|
|
98
|
-
discards
|
|
99
|
-
__ggml_vocab_test__
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
🚀 (normal) 😶🌫️ (multiple emojis concatenated) ✅ 🦙🦙 3 33 333 3333 33333 333333 3333333 33333333 3.3 3..3 3...3 កាន់តែពិសេសអាច😁 ?我想在apple工作1314151天~ ------======= нещо на Български ''''''```````""""......!!!!!!?????? I've been 'told he's there, 'RE you sure? 'M not sure I'll make it, 'D you like some tea? We'Ve a'lL
|
|
112
|
-
__ggml_vocab_test__
|
|
@@ -1,46 +0,0 @@
|
|
|
1
|
-
2550 204 18430 377
|
|
2
|
-
597 2768 298 8564
|
|
3
|
-
|
|
4
|
-
1437
|
|
5
|
-
1437 1437
|
|
6
|
-
1437 1437 1437
|
|
7
|
-
50117
|
|
8
|
-
50118
|
|
9
|
-
50140
|
|
10
|
-
50140 50118
|
|
11
|
-
50117 50118
|
|
12
|
-
31414 232
|
|
13
|
-
20920 232
|
|
14
|
-
31414 623
|
|
15
|
-
20920 623
|
|
16
|
-
20920 623 328
|
|
17
|
-
31414 6 232 328
|
|
18
|
-
20920 6 232 328
|
|
19
|
-
42 16 8103 18164 27 4 49317
|
|
20
|
-
605 40976 262 10109 18474 385 29 36807 6455
|
|
21
|
-
36765 25482 22063 23171 34251 18697 10809 26161 18697 3602 22063 27969 40966 25417 15264 26161 24269 36709 41171 35328
|
|
22
|
-
1376 17772 7471 1376 17772 19002 1376 17772 9085 1376 4333 13859 1376 17772 9357 1376 4333 9264 1376 17772 25448 1376 17772 18400 1376 17772 4333 1376 4333 10172 1376 17772 4333 1376 17772 7258 1376 17772 19002 1376 17772 5782 1376 17772 10172 1376 17772 3726 1376 17772 5782 1376 4333 10172 1376 17772 23171
|
|
23
|
-
6569 15113 7471 36 21113 43 17841 19002 17 8384 6569 14285 4958 12605 36 34654 2841 4203 354 10146 26511 1070 43 36174 5782 36 8338 21554 14 34 63 308 19233 43
|
|
24
|
-
31414
|
|
25
|
-
20920
|
|
26
|
-
1437 20920
|
|
27
|
-
1437 1437 20920
|
|
28
|
-
1437 1437 1437 20920
|
|
29
|
-
1437 1437 1437 20920 50118 1437 1437 1437 20920
|
|
30
|
-
36
|
|
31
|
-
50118 5457
|
|
32
|
-
108 3567
|
|
33
|
-
31414 6 1423 108 1250 328 1336 32 47 17841 10172 17487 47876 3602 48617 15264 46537 11423 27326 48494 8210 49233 1558 1570 27761 49429 43251 10809 17772
|
|
34
|
-
32376 12846
|
|
35
|
-
246
|
|
36
|
-
3103
|
|
37
|
-
25631
|
|
38
|
-
46152
|
|
39
|
-
3103 25631
|
|
40
|
-
46152 3103
|
|
41
|
-
46152 25631
|
|
42
|
-
46152 46152
|
|
43
|
-
46152 3103 25631
|
|
44
|
-
347 1376 2023 12410 102 16376 1376 2023 6382 90
|
|
45
|
-
9553 5954
|
|
46
|
-
50118 1437 50140 1437 50140 50118 1437 50117 1437 50117 50117 1437 50117 50118 1437 1437 50118 1437 1437 1437 50118 1437 1437 1437 1437 50118 1437 1437 1437 1437 1437 50118 6569 15113 7471 36 21113 43 17841 19002 17 8384 6569 14285 4958 12605 36 34654 2841 4203 354 10146 26511 1070 43 36174 5782 8103 18164 27 6569 18164 27 155 2357 30242 155 25631 30242 3103 30242 25631 30242 46152 30242 3103 25631 155 4 246 155 7586 246 155 734 246 25974 17772 7471 1376 17772 19002 1376 17772 9085 1376 4333 13859 1376 17772 9357 1376 4333 9264 1376 17772 25448 1376 17772 18400 1376 17772 4333 1376 4333 10172 1376 17772 4333 1376 17772 7258 1376 17772 19002 1376 17772 5782 18636 10172 17487 47876 3602 48617 15264 46537 11423 27326 48494 8210 49233 1558 1570 27761 49429 43251 10809 17772 36738 48332 47463 18697 10809 25482 22063 23171 34251 18697 10809 26161 18697 3602 22063 27969 40966 25417 15264 26161 24269 36709 41171 35328 128 49690 108 49972 49519 12905 48149 48149 43796 32376 12846 27282 28749 38 348 57 128 41042 37 18 89 6 128 4629 47 686 116 128 448 45 686 38 581 146 24 6 128 495 47 101 103 6845 116 166 108 30660 10 108 462 574
|
|
Binary file
|
|
@@ -1,112 +0,0 @@
|
|
|
1
|
-
ied 4 ½ months
|
|
2
|
-
__ggml_vocab_test__
|
|
3
|
-
Führer
|
|
4
|
-
__ggml_vocab_test__
|
|
5
|
-
|
|
6
|
-
__ggml_vocab_test__
|
|
7
|
-
|
|
8
|
-
__ggml_vocab_test__
|
|
9
|
-
|
|
10
|
-
__ggml_vocab_test__
|
|
11
|
-
|
|
12
|
-
__ggml_vocab_test__
|
|
13
|
-
|
|
14
|
-
__ggml_vocab_test__
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
__ggml_vocab_test__
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
__ggml_vocab_test__
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
__ggml_vocab_test__
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
__ggml_vocab_test__
|
|
30
|
-
Hello world
|
|
31
|
-
__ggml_vocab_test__
|
|
32
|
-
Hello world
|
|
33
|
-
__ggml_vocab_test__
|
|
34
|
-
Hello World
|
|
35
|
-
__ggml_vocab_test__
|
|
36
|
-
Hello World
|
|
37
|
-
__ggml_vocab_test__
|
|
38
|
-
Hello World!
|
|
39
|
-
__ggml_vocab_test__
|
|
40
|
-
Hello, world!
|
|
41
|
-
__ggml_vocab_test__
|
|
42
|
-
Hello, world!
|
|
43
|
-
__ggml_vocab_test__
|
|
44
|
-
this is 🦙.cpp
|
|
45
|
-
__ggml_vocab_test__
|
|
46
|
-
w048 7tuijk dsdfhu
|
|
47
|
-
__ggml_vocab_test__
|
|
48
|
-
нещо на Български
|
|
49
|
-
__ggml_vocab_test__
|
|
50
|
-
កាន់តែពិសេសអាចខលចេញ
|
|
51
|
-
__ggml_vocab_test__
|
|
52
|
-
🚀 (normal) 😶🌫️ (multiple emojis concatenated) ✅ (only emoji that has its own token)
|
|
53
|
-
__ggml_vocab_test__
|
|
54
|
-
Hello
|
|
55
|
-
__ggml_vocab_test__
|
|
56
|
-
Hello
|
|
57
|
-
__ggml_vocab_test__
|
|
58
|
-
Hello
|
|
59
|
-
__ggml_vocab_test__
|
|
60
|
-
Hello
|
|
61
|
-
__ggml_vocab_test__
|
|
62
|
-
Hello
|
|
63
|
-
__ggml_vocab_test__
|
|
64
|
-
Hello
|
|
65
|
-
Hello
|
|
66
|
-
__ggml_vocab_test__
|
|
67
|
-
(
|
|
68
|
-
__ggml_vocab_test__
|
|
69
|
-
|
|
70
|
-
=
|
|
71
|
-
__ggml_vocab_test__
|
|
72
|
-
' era
|
|
73
|
-
__ggml_vocab_test__
|
|
74
|
-
Hello, y'all! How are you 😁 ?我想在apple工作1314151天~
|
|
75
|
-
__ggml_vocab_test__
|
|
76
|
-
!!!!!!
|
|
77
|
-
__ggml_vocab_test__
|
|
78
|
-
3
|
|
79
|
-
__ggml_vocab_test__
|
|
80
|
-
33
|
|
81
|
-
__ggml_vocab_test__
|
|
82
|
-
333
|
|
83
|
-
__ggml_vocab_test__
|
|
84
|
-
3333
|
|
85
|
-
__ggml_vocab_test__
|
|
86
|
-
33333
|
|
87
|
-
__ggml_vocab_test__
|
|
88
|
-
333333
|
|
89
|
-
__ggml_vocab_test__
|
|
90
|
-
3333333
|
|
91
|
-
__ggml_vocab_test__
|
|
92
|
-
33333333
|
|
93
|
-
__ggml_vocab_test__
|
|
94
|
-
333333333
|
|
95
|
-
__ggml_vocab_test__
|
|
96
|
-
Cửa Việt
|
|
97
|
-
__ggml_vocab_test__
|
|
98
|
-
discards
|
|
99
|
-
__ggml_vocab_test__
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
🚀 (normal) 😶🌫️ (multiple emojis concatenated) ✅ 🦙🦙 3 33 333 3333 33333 333333 3333333 33333333 3.3 3..3 3...3 កាន់តែពិសេសអាច😁 ?我想在apple工作1314151天~ ------======= нещо на Български ''''''```````""""......!!!!!!?????? I've been 'told he's there, 'RE you sure? 'M not sure I'll make it, 'D you like some tea? We'Ve a'lL
|
|
112
|
-
__ggml_vocab_test__
|
|
@@ -1,46 +0,0 @@
|
|
|
1
|
-
4850 244 57 244 162 159 17722
|
|
2
|
-
75 2022 3943 284
|
|
3
|
-
|
|
4
|
-
244
|
|
5
|
-
280
|
|
6
|
-
283
|
|
7
|
-
221
|
|
8
|
-
222
|
|
9
|
-
499
|
|
10
|
-
3067
|
|
11
|
-
15767
|
|
12
|
-
8302 5810
|
|
13
|
-
12009 5810
|
|
14
|
-
8302 10914
|
|
15
|
-
12009 10914
|
|
16
|
-
12009 10914 38
|
|
17
|
-
8302 49 5810 38
|
|
18
|
-
12009 49 5810 38
|
|
19
|
-
477 458 5954 137 271 51 3779
|
|
20
|
-
124 53 57 61 244 60 121 1726 12568 10240 1519 8290
|
|
21
|
-
39916 8389 1059 9504 40216 13858 2073 8983 12571 1539 10721
|
|
22
|
-
14566 246 14566 152 14566 265 30428 257 14566 261 30428 248 14566 268 14566 153 14566 277 30428 247 14566 277 14566 133 14566 152 14566 251 14566 247 14566 273 14566 251 30428 247 14566 255
|
|
23
|
-
3822 272 246 327 4434 46 18445 152 46030 45022 142 13878 327 12585 19884 33773 40920 751 46 41839 327 2605 22716 708 1421 2840 4387 2421 46
|
|
24
|
-
8302
|
|
25
|
-
12009
|
|
26
|
-
244 12009
|
|
27
|
-
280 12009
|
|
28
|
-
283 12009
|
|
29
|
-
283 12009 303 12009
|
|
30
|
-
327
|
|
31
|
-
222 299
|
|
32
|
-
44 34719
|
|
33
|
-
8302 49 553 44 483 38 4998 904 863 18445 247 1037 4995 13379 2924 9515 17823 54 56 54 57 54 58 54 11904 47892
|
|
34
|
-
9221 3226
|
|
35
|
-
56
|
|
36
|
-
56 56
|
|
37
|
-
56 56 56
|
|
38
|
-
56 56 56 56
|
|
39
|
-
56 56 56 56 56
|
|
40
|
-
56 56 56 56 56 56
|
|
41
|
-
56 56 56 56 56 56 56
|
|
42
|
-
56 56 56 56 56 56 56 56
|
|
43
|
-
56 56 56 56 56 56 56 56 56
|
|
44
|
-
72 34269 102 33245 17234 121
|
|
45
|
-
1236 12266
|
|
46
|
-
353 736 8886 221 10883 4238 16101 28540 222 3822 272 246 327 4434 46 18445 152 46030 45022 142 13878 327 12585 19884 33773 40920 751 46 41839 5954 137 271 3822 137 271 244 56 244 56 56 244 56 56 56 244 56 56 56 56 244 56 56 56 56 56 244 56 56 56 56 56 56 244 56 56 56 56 56 56 56 244 56 56 56 56 56 56 56 56 244 56 51 56 244 56 516 56 244 56 1198 56 244 14566 246 14566 152 14566 265 30428 257 14566 261 30428 248 14566 268 14566 153 14566 277 30428 247 14566 277 14566 133 14566 152 14566 251 36570 247 1037 4995 13379 2924 9515 17823 54 56 54 57 54 58 54 11904 47892 20895 16625 13047 8389 1059 9504 40216 13858 2073 8983 12571 1539 10721 5918 9643 13298 932 31723 31330 9221 3226 35426 10400 457 4783 2602 349 121 1477 957 1200 2038 49 349 632 863 3673 68 349 82 666 3673 457 4650 1949 580 49 349 73 863 2144 1649 35941 68 2726 44 7728 331 44 113 81
|
|
@@ -1,9 +0,0 @@
|
|
|
1
|
-
set(TARGET llama-vdot)
|
|
2
|
-
add_executable(${TARGET} vdot.cpp)
|
|
3
|
-
target_link_libraries(${TARGET} PRIVATE common llama ${CMAKE_THREAD_LIBS_INIT})
|
|
4
|
-
target_compile_features(${TARGET} PRIVATE cxx_std_17)
|
|
5
|
-
|
|
6
|
-
set(TARGET llama-q8dot)
|
|
7
|
-
add_executable(${TARGET} q8dot.cpp)
|
|
8
|
-
target_link_libraries(${TARGET} PRIVATE common llama ${CMAKE_THREAD_LIBS_INIT})
|
|
9
|
-
target_compile_features(${TARGET} PRIVATE cxx_std_17)
|
|
@@ -1,173 +0,0 @@
|
|
|
1
|
-
#include <cstdio>
|
|
2
|
-
#include <type_traits>
|
|
3
|
-
#include <vector>
|
|
4
|
-
#include <random>
|
|
5
|
-
#include <chrono>
|
|
6
|
-
#include <cstdlib>
|
|
7
|
-
#include <cmath>
|
|
8
|
-
#include <cassert>
|
|
9
|
-
#include <cstring>
|
|
10
|
-
#include <array>
|
|
11
|
-
#include <type_traits>
|
|
12
|
-
|
|
13
|
-
#include <ggml.h>
|
|
14
|
-
#include <ggml-cpu.h>
|
|
15
|
-
|
|
16
|
-
constexpr int kVecSize = 1 << 16;
|
|
17
|
-
|
|
18
|
-
// Copy-pasted from ggml.c
|
|
19
|
-
#define QK4_0 32
|
|
20
|
-
typedef struct {
|
|
21
|
-
float d; // delta
|
|
22
|
-
uint8_t qs[QK4_0 / 2]; // nibbles / quants
|
|
23
|
-
} block_q4_0;
|
|
24
|
-
static_assert(sizeof(block_q4_0) == sizeof(float) + QK4_0 / 2, "wrong q4_0 block size/padding");
|
|
25
|
-
|
|
26
|
-
#define QK4_1 32
|
|
27
|
-
typedef struct {
|
|
28
|
-
float d; // delta
|
|
29
|
-
float m; // min
|
|
30
|
-
uint8_t qs[QK4_1 / 2]; // nibbles / quants
|
|
31
|
-
} block_q4_1;
|
|
32
|
-
static_assert(sizeof(block_q4_1) == sizeof(float) * 2 + QK4_1 / 2, "wrong q4_1 block size/padding");
|
|
33
|
-
|
|
34
|
-
// Copy-pasted from ggml.c
|
|
35
|
-
#define QK8_0 32
|
|
36
|
-
typedef struct {
|
|
37
|
-
float d; // delta
|
|
38
|
-
float s; // d * sum(qs[i])
|
|
39
|
-
int8_t qs[QK8_0]; // quants
|
|
40
|
-
} block_q8_0;
|
|
41
|
-
static_assert(sizeof(block_q8_0) == 2*sizeof(float) + QK8_0, "wrong q8_0 block size/padding");
|
|
42
|
-
|
|
43
|
-
static_assert(QK4_1 == QK8_0, "QK4_1 and QK8_0 must be the same");
|
|
44
|
-
static_assert(QK4_0 == QK8_0, "QK4_0 and QK8_0 must be the same");
|
|
45
|
-
|
|
46
|
-
template <typename T>
|
|
47
|
-
static void fillQ4blocks(std::vector<T>& blocks, std::mt19937& rndm) {
|
|
48
|
-
for (auto& b : blocks) {
|
|
49
|
-
b.d = 1;
|
|
50
|
-
for (int i=0; i<QK4_1/2; ++i) {
|
|
51
|
-
uint8_t v1 = rndm() >> 28;
|
|
52
|
-
uint8_t v2 = rndm() >> 28;
|
|
53
|
-
b.qs[i] = v1 | (v2 << 4);
|
|
54
|
-
}
|
|
55
|
-
}
|
|
56
|
-
}
|
|
57
|
-
|
|
58
|
-
static void fillQ80blocks(std::vector<block_q8_0>& blocks, std::mt19937& rndm) {
|
|
59
|
-
for (auto& b : blocks) {
|
|
60
|
-
b.d = 1;
|
|
61
|
-
int sum = 0;
|
|
62
|
-
for (int i=0; i<QK8_0; ++i) {
|
|
63
|
-
b.qs[i] = (rndm() >> 24) - 128;
|
|
64
|
-
sum += b.qs[i];
|
|
65
|
-
}
|
|
66
|
-
b.s = b.d * sum;
|
|
67
|
-
}
|
|
68
|
-
}
|
|
69
|
-
|
|
70
|
-
static float simpleDot(const block_q4_0& x, const block_q8_0& y) {
|
|
71
|
-
int s1 = 0; //, s2 = 0;
|
|
72
|
-
for (int i=0; i<QK4_1/2; i+=2) {
|
|
73
|
-
int v1 = x.qs[i+0] & 0xf;
|
|
74
|
-
int v2 = x.qs[i+0] >> 4;
|
|
75
|
-
int v3 = x.qs[i+1] & 0xf;
|
|
76
|
-
int v4 = x.qs[i+1] >> 4;
|
|
77
|
-
int j = 2*i;
|
|
78
|
-
s1 += v1*y.qs[j] + v2*y.qs[j+1] + v3*y.qs[j+2] + v4*y.qs[j+3];
|
|
79
|
-
//s2 += y.qs[j] + y.qs[j+1] + y.qs[j+2] + y.qs[j+3];
|
|
80
|
-
}
|
|
81
|
-
return y.d * x.d * s1 - 8 * x.d * y.s;
|
|
82
|
-
//return y.d * x.d * (s1 - 8 * s2);
|
|
83
|
-
}
|
|
84
|
-
|
|
85
|
-
static float simpleDot(const block_q4_1& x, const block_q8_0& y) {
|
|
86
|
-
int s1 = 0; //, s2 = 0;
|
|
87
|
-
for (int i=0; i<QK4_1/2; i+=2) {
|
|
88
|
-
int v1 = x.qs[i+0] & 0xf;
|
|
89
|
-
int v2 = x.qs[i+0] >> 4;
|
|
90
|
-
int v3 = x.qs[i+1] & 0xf;
|
|
91
|
-
int v4 = x.qs[i+1] >> 4;
|
|
92
|
-
int j = 2*i;
|
|
93
|
-
s1 += v1*y.qs[j] + v2*y.qs[j+1] + v3*y.qs[j+2] + v4*y.qs[j+3];
|
|
94
|
-
//s2 += y.qs[j] + y.qs[j+1] + y.qs[j+2] + y.qs[j+3];
|
|
95
|
-
}
|
|
96
|
-
return y.d * x.d * s1 + y.s * x.m;
|
|
97
|
-
//return y.d * (x.d * s1 + x.m * s2);
|
|
98
|
-
}
|
|
99
|
-
|
|
100
|
-
struct Stat {
|
|
101
|
-
double sum = 0, sumt = 0, sumt2 = 0, maxt = 0;
|
|
102
|
-
int nloop = 0;
|
|
103
|
-
void addResult(double s, double t) {
|
|
104
|
-
sum += s;
|
|
105
|
-
sumt += t; sumt2 += t*t; maxt = std::max(maxt, t);
|
|
106
|
-
++nloop;
|
|
107
|
-
}
|
|
108
|
-
void reportResult(const char* title) const {
|
|
109
|
-
if (nloop < 1) {
|
|
110
|
-
printf("%s(%s): no result\n",__func__,title);
|
|
111
|
-
return;
|
|
112
|
-
}
|
|
113
|
-
printf("============ %s\n",title);
|
|
114
|
-
printf("<dot> = %g\n",sum/nloop);
|
|
115
|
-
auto t = sumt/nloop, dt = sumt2/nloop - t*t;
|
|
116
|
-
if (dt > 0) dt = sqrt(dt);
|
|
117
|
-
printf("<time> = %g +/- %g us. Max. time = %g us.\n",t,dt,maxt);
|
|
118
|
-
}
|
|
119
|
-
};
|
|
120
|
-
|
|
121
|
-
|
|
122
|
-
int main(int argc, char** argv) {
|
|
123
|
-
|
|
124
|
-
int nloop = argc > 1 ? atoi(argv[1]) : 10;
|
|
125
|
-
int type = argc > 2 ? atoi(argv[2]) : 1;
|
|
126
|
-
|
|
127
|
-
std::mt19937 rndm(1234);
|
|
128
|
-
|
|
129
|
-
std::vector<block_q4_1> x41;
|
|
130
|
-
std::vector<block_q4_0> x40;
|
|
131
|
-
std::vector<block_q8_0> y(kVecSize);
|
|
132
|
-
if (type == 0) x40.resize(kVecSize);
|
|
133
|
-
else {
|
|
134
|
-
x41.resize(kVecSize);
|
|
135
|
-
for (auto& b : x41) b.m = 1;
|
|
136
|
-
}
|
|
137
|
-
|
|
138
|
-
auto ggml_type = type == 0 ? GGML_TYPE_Q4_0 : GGML_TYPE_Q4_1;
|
|
139
|
-
|
|
140
|
-
const auto * funcs = ggml_get_type_traits_cpu(ggml_type);
|
|
141
|
-
|
|
142
|
-
Stat simple, ggml;
|
|
143
|
-
|
|
144
|
-
for (int iloop=0; iloop<nloop; ++iloop) {
|
|
145
|
-
|
|
146
|
-
if (type == 0) fillQ4blocks(x40, rndm);
|
|
147
|
-
else fillQ4blocks(x41, rndm);
|
|
148
|
-
fillQ80blocks(y, rndm);
|
|
149
|
-
|
|
150
|
-
auto t1 = std::chrono::high_resolution_clock::now();
|
|
151
|
-
double s = 0;
|
|
152
|
-
if (type == 0) for (int i=0; i<kVecSize; ++i) s += simpleDot(x40[i], y[i]);
|
|
153
|
-
else for (int i=0; i<kVecSize; ++i) s += simpleDot(x41[i], y[i]);
|
|
154
|
-
auto t2 = std::chrono::high_resolution_clock::now();
|
|
155
|
-
auto t = 1e-3*std::chrono::duration_cast<std::chrono::nanoseconds>(t2-t1).count();
|
|
156
|
-
if (iloop > 3) simple.addResult(s, t);
|
|
157
|
-
|
|
158
|
-
t1 = std::chrono::high_resolution_clock::now();
|
|
159
|
-
float fs;
|
|
160
|
-
if (type == 0) funcs->vec_dot(kVecSize * QK4_1, &fs, 0, x40.data(), 0, y.data(), 0, 1);
|
|
161
|
-
else funcs->vec_dot(kVecSize * QK4_1, &fs, 0, x41.data(), 0, y.data(), 0, 1);
|
|
162
|
-
t2 = std::chrono::high_resolution_clock::now();
|
|
163
|
-
t = 1e-3*std::chrono::duration_cast<std::chrono::nanoseconds>(t2-t1).count();
|
|
164
|
-
if (iloop > 3) ggml.addResult(fs, t);
|
|
165
|
-
|
|
166
|
-
}
|
|
167
|
-
|
|
168
|
-
// Report the time (and the average of the dot products so the compiler does not come up with the idea
|
|
169
|
-
// of optimizing away the function calls after figuring that the result is not used).
|
|
170
|
-
simple.reportResult("Simple");
|
|
171
|
-
ggml.reportResult("ggml");
|
|
172
|
-
return 0;
|
|
173
|
-
}
|