@fugood/llama.node 0.6.3 → 1.0.0-beta.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (377) hide show
  1. package/CMakeLists.txt +40 -30
  2. package/README.md +4 -1
  3. package/lib/binding.js +41 -29
  4. package/lib/binding.ts +26 -25
  5. package/package.json +40 -7
  6. package/scripts/build.js +47 -0
  7. package/scripts/llama.cpp.patch +109 -0
  8. package/src/anyascii.c +22223 -0
  9. package/src/anyascii.h +42 -0
  10. package/src/tts_utils.cpp +20 -7
  11. package/src/tts_utils.h +2 -0
  12. package/bin/darwin/arm64/llama-node.node +0 -0
  13. package/bin/darwin/x64/llama-node.node +0 -0
  14. package/bin/linux/arm64/llama-node.node +0 -0
  15. package/bin/linux/x64/llama-node.node +0 -0
  16. package/bin/linux-cuda/arm64/llama-node.node +0 -0
  17. package/bin/linux-cuda/x64/llama-node.node +0 -0
  18. package/bin/linux-vulkan/arm64/llama-node.node +0 -0
  19. package/bin/linux-vulkan/x64/llama-node.node +0 -0
  20. package/bin/win32/x64/llama-node.node +0 -0
  21. package/bin/win32/x64/node.lib +0 -0
  22. package/bin/win32-vulkan/arm64/llama-node.node +0 -0
  23. package/bin/win32-vulkan/arm64/node.lib +0 -0
  24. package/bin/win32-vulkan/x64/llama-node.node +0 -0
  25. package/bin/win32-vulkan/x64/node.lib +0 -0
  26. package/src/llama.cpp/.github/workflows/build-linux-cross.yml +0 -233
  27. package/src/llama.cpp/.github/workflows/build.yml +0 -1078
  28. package/src/llama.cpp/.github/workflows/close-issue.yml +0 -28
  29. package/src/llama.cpp/.github/workflows/docker.yml +0 -178
  30. package/src/llama.cpp/.github/workflows/editorconfig.yml +0 -29
  31. package/src/llama.cpp/.github/workflows/gguf-publish.yml +0 -44
  32. package/src/llama.cpp/.github/workflows/labeler.yml +0 -17
  33. package/src/llama.cpp/.github/workflows/python-check-requirements.yml +0 -33
  34. package/src/llama.cpp/.github/workflows/python-lint.yml +0 -30
  35. package/src/llama.cpp/.github/workflows/python-type-check.yml +0 -40
  36. package/src/llama.cpp/.github/workflows/release.yml +0 -739
  37. package/src/llama.cpp/.github/workflows/server.yml +0 -237
  38. package/src/llama.cpp/.github/workflows/winget.yml +0 -42
  39. package/src/llama.cpp/cmake/arm64-apple-clang.cmake +0 -16
  40. package/src/llama.cpp/cmake/arm64-windows-llvm.cmake +0 -16
  41. package/src/llama.cpp/cmake/build-info.cmake +0 -64
  42. package/src/llama.cpp/cmake/common.cmake +0 -35
  43. package/src/llama.cpp/cmake/git-vars.cmake +0 -22
  44. package/src/llama.cpp/cmake/x64-windows-llvm.cmake +0 -5
  45. package/src/llama.cpp/common/build-info.cpp.in +0 -4
  46. package/src/llama.cpp/docs/build.md +0 -561
  47. package/src/llama.cpp/examples/CMakeLists.txt +0 -43
  48. package/src/llama.cpp/examples/batched/CMakeLists.txt +0 -5
  49. package/src/llama.cpp/examples/batched/batched.cpp +0 -246
  50. package/src/llama.cpp/examples/chat-13B.bat +0 -57
  51. package/src/llama.cpp/examples/convert-llama2c-to-ggml/CMakeLists.txt +0 -5
  52. package/src/llama.cpp/examples/convert-llama2c-to-ggml/convert-llama2c-to-ggml.cpp +0 -941
  53. package/src/llama.cpp/examples/deprecation-warning/deprecation-warning.cpp +0 -35
  54. package/src/llama.cpp/examples/embedding/CMakeLists.txt +0 -5
  55. package/src/llama.cpp/examples/embedding/embedding.cpp +0 -323
  56. package/src/llama.cpp/examples/eval-callback/CMakeLists.txt +0 -10
  57. package/src/llama.cpp/examples/eval-callback/eval-callback.cpp +0 -194
  58. package/src/llama.cpp/examples/gen-docs/CMakeLists.txt +0 -5
  59. package/src/llama.cpp/examples/gen-docs/gen-docs.cpp +0 -83
  60. package/src/llama.cpp/examples/gguf/CMakeLists.txt +0 -5
  61. package/src/llama.cpp/examples/gguf/gguf.cpp +0 -265
  62. package/src/llama.cpp/examples/gguf-hash/CMakeLists.txt +0 -22
  63. package/src/llama.cpp/examples/gguf-hash/deps/rotate-bits/rotate-bits.h +0 -46
  64. package/src/llama.cpp/examples/gguf-hash/deps/sha1/sha1.c +0 -295
  65. package/src/llama.cpp/examples/gguf-hash/deps/sha1/sha1.h +0 -52
  66. package/src/llama.cpp/examples/gguf-hash/deps/sha256/sha256.c +0 -221
  67. package/src/llama.cpp/examples/gguf-hash/deps/sha256/sha256.h +0 -24
  68. package/src/llama.cpp/examples/gguf-hash/deps/xxhash/xxhash.c +0 -42
  69. package/src/llama.cpp/examples/gguf-hash/deps/xxhash/xxhash.h +0 -7093
  70. package/src/llama.cpp/examples/gguf-hash/gguf-hash.cpp +0 -694
  71. package/src/llama.cpp/examples/gritlm/CMakeLists.txt +0 -5
  72. package/src/llama.cpp/examples/gritlm/gritlm.cpp +0 -229
  73. package/src/llama.cpp/examples/jeopardy/questions.txt +0 -100
  74. package/src/llama.cpp/examples/llama.android/app/build.gradle.kts +0 -65
  75. package/src/llama.cpp/examples/llama.android/build.gradle.kts +0 -6
  76. package/src/llama.cpp/examples/llama.android/llama/build.gradle.kts +0 -71
  77. package/src/llama.cpp/examples/llama.android/llama/src/main/cpp/CMakeLists.txt +0 -53
  78. package/src/llama.cpp/examples/llama.android/llama/src/main/cpp/llama-android.cpp +0 -452
  79. package/src/llama.cpp/examples/llama.android/settings.gradle.kts +0 -18
  80. package/src/llama.cpp/examples/lookahead/CMakeLists.txt +0 -5
  81. package/src/llama.cpp/examples/lookahead/lookahead.cpp +0 -472
  82. package/src/llama.cpp/examples/lookup/CMakeLists.txt +0 -23
  83. package/src/llama.cpp/examples/lookup/lookup-create.cpp +0 -40
  84. package/src/llama.cpp/examples/lookup/lookup-merge.cpp +0 -47
  85. package/src/llama.cpp/examples/lookup/lookup-stats.cpp +0 -157
  86. package/src/llama.cpp/examples/lookup/lookup.cpp +0 -242
  87. package/src/llama.cpp/examples/parallel/CMakeLists.txt +0 -5
  88. package/src/llama.cpp/examples/parallel/parallel.cpp +0 -492
  89. package/src/llama.cpp/examples/passkey/CMakeLists.txt +0 -5
  90. package/src/llama.cpp/examples/passkey/passkey.cpp +0 -277
  91. package/src/llama.cpp/examples/retrieval/CMakeLists.txt +0 -5
  92. package/src/llama.cpp/examples/retrieval/retrieval.cpp +0 -304
  93. package/src/llama.cpp/examples/save-load-state/CMakeLists.txt +0 -5
  94. package/src/llama.cpp/examples/save-load-state/save-load-state.cpp +0 -246
  95. package/src/llama.cpp/examples/simple/CMakeLists.txt +0 -5
  96. package/src/llama.cpp/examples/simple/simple.cpp +0 -206
  97. package/src/llama.cpp/examples/simple-chat/CMakeLists.txt +0 -5
  98. package/src/llama.cpp/examples/simple-chat/simple-chat.cpp +0 -206
  99. package/src/llama.cpp/examples/simple-cmake-pkg/CMakeLists.txt +0 -11
  100. package/src/llama.cpp/examples/speculative/CMakeLists.txt +0 -5
  101. package/src/llama.cpp/examples/speculative/speculative.cpp +0 -644
  102. package/src/llama.cpp/examples/speculative-simple/CMakeLists.txt +0 -5
  103. package/src/llama.cpp/examples/speculative-simple/speculative-simple.cpp +0 -261
  104. package/src/llama.cpp/examples/sycl/CMakeLists.txt +0 -9
  105. package/src/llama.cpp/examples/sycl/build.sh +0 -23
  106. package/src/llama.cpp/examples/sycl/ls-sycl-device.cpp +0 -13
  107. package/src/llama.cpp/examples/sycl/run-llama2.sh +0 -27
  108. package/src/llama.cpp/examples/sycl/run-llama3.sh +0 -28
  109. package/src/llama.cpp/examples/sycl/win-build-sycl.bat +0 -33
  110. package/src/llama.cpp/examples/sycl/win-run-llama2.bat +0 -9
  111. package/src/llama.cpp/examples/sycl/win-run-llama3.bat +0 -9
  112. package/src/llama.cpp/examples/training/CMakeLists.txt +0 -5
  113. package/src/llama.cpp/examples/training/finetune.cpp +0 -96
  114. package/src/llama.cpp/ggml/cmake/GitVars.cmake +0 -22
  115. package/src/llama.cpp/ggml/cmake/common.cmake +0 -26
  116. package/src/llama.cpp/ggml/src/ggml-alloc.c +0 -1042
  117. package/src/llama.cpp/ggml/src/ggml-backend-impl.h +0 -255
  118. package/src/llama.cpp/ggml/src/ggml-backend-reg.cpp +0 -586
  119. package/src/llama.cpp/ggml/src/ggml-backend.cpp +0 -2008
  120. package/src/llama.cpp/ggml/src/ggml-blas/CMakeLists.txt +0 -87
  121. package/src/llama.cpp/ggml/src/ggml-blas/ggml-blas.cpp +0 -517
  122. package/src/llama.cpp/ggml/src/ggml-cann/CMakeLists.txt +0 -74
  123. package/src/llama.cpp/ggml/src/ggml-cann/acl_tensor.cpp +0 -179
  124. package/src/llama.cpp/ggml/src/ggml-cann/acl_tensor.h +0 -258
  125. package/src/llama.cpp/ggml/src/ggml-cann/aclnn_ops.cpp +0 -2863
  126. package/src/llama.cpp/ggml/src/ggml-cann/aclnn_ops.h +0 -1110
  127. package/src/llama.cpp/ggml/src/ggml-cann/common.h +0 -420
  128. package/src/llama.cpp/ggml/src/ggml-cann/ggml-cann.cpp +0 -2570
  129. package/src/llama.cpp/ggml/src/ggml-common.h +0 -1857
  130. package/src/llama.cpp/ggml/src/ggml-cpu/cmake/FindSIMD.cmake +0 -100
  131. package/src/llama.cpp/ggml/src/ggml-cuda/CMakeLists.txt +0 -184
  132. package/src/llama.cpp/ggml/src/ggml-cuda/vendors/cuda.h +0 -15
  133. package/src/llama.cpp/ggml/src/ggml-cuda/vendors/hip.h +0 -243
  134. package/src/llama.cpp/ggml/src/ggml-cuda/vendors/musa.h +0 -140
  135. package/src/llama.cpp/ggml/src/ggml-hip/CMakeLists.txt +0 -131
  136. package/src/llama.cpp/ggml/src/ggml-impl.h +0 -601
  137. package/src/llama.cpp/ggml/src/ggml-kompute/CMakeLists.txt +0 -166
  138. package/src/llama.cpp/ggml/src/ggml-kompute/ggml-kompute.cpp +0 -2251
  139. package/src/llama.cpp/ggml/src/ggml-metal/CMakeLists.txt +0 -120
  140. package/src/llama.cpp/ggml/src/ggml-metal/ggml-metal-impl.h +0 -622
  141. package/src/llama.cpp/ggml/src/ggml-musa/CMakeLists.txt +0 -113
  142. package/src/llama.cpp/ggml/src/ggml-opencl/CMakeLists.txt +0 -96
  143. package/src/llama.cpp/ggml/src/ggml-opencl/ggml-opencl.cpp +0 -5124
  144. package/src/llama.cpp/ggml/src/ggml-opt.cpp +0 -1037
  145. package/src/llama.cpp/ggml/src/ggml-quants.c +0 -5232
  146. package/src/llama.cpp/ggml/src/ggml-quants.h +0 -100
  147. package/src/llama.cpp/ggml/src/ggml-rpc/CMakeLists.txt +0 -9
  148. package/src/llama.cpp/ggml/src/ggml-rpc/ggml-rpc.cpp +0 -1813
  149. package/src/llama.cpp/ggml/src/ggml-sycl/CMakeLists.txt +0 -189
  150. package/src/llama.cpp/ggml/src/ggml-sycl/backend.hpp +0 -37
  151. package/src/llama.cpp/ggml/src/ggml-sycl/binbcast.cpp +0 -239
  152. package/src/llama.cpp/ggml/src/ggml-sycl/binbcast.hpp +0 -39
  153. package/src/llama.cpp/ggml/src/ggml-sycl/common.cpp +0 -83
  154. package/src/llama.cpp/ggml/src/ggml-sycl/common.hpp +0 -493
  155. package/src/llama.cpp/ggml/src/ggml-sycl/concat.cpp +0 -197
  156. package/src/llama.cpp/ggml/src/ggml-sycl/concat.hpp +0 -20
  157. package/src/llama.cpp/ggml/src/ggml-sycl/conv.cpp +0 -100
  158. package/src/llama.cpp/ggml/src/ggml-sycl/conv.hpp +0 -20
  159. package/src/llama.cpp/ggml/src/ggml-sycl/convert.cpp +0 -623
  160. package/src/llama.cpp/ggml/src/ggml-sycl/convert.hpp +0 -34
  161. package/src/llama.cpp/ggml/src/ggml-sycl/cpy.cpp +0 -701
  162. package/src/llama.cpp/ggml/src/ggml-sycl/cpy.hpp +0 -11
  163. package/src/llama.cpp/ggml/src/ggml-sycl/dequantize.hpp +0 -791
  164. package/src/llama.cpp/ggml/src/ggml-sycl/dmmv.cpp +0 -1160
  165. package/src/llama.cpp/ggml/src/ggml-sycl/dmmv.hpp +0 -27
  166. package/src/llama.cpp/ggml/src/ggml-sycl/dpct/helper.hpp +0 -2957
  167. package/src/llama.cpp/ggml/src/ggml-sycl/element_wise.cpp +0 -1536
  168. package/src/llama.cpp/ggml/src/ggml-sycl/element_wise.hpp +0 -75
  169. package/src/llama.cpp/ggml/src/ggml-sycl/gemm.hpp +0 -99
  170. package/src/llama.cpp/ggml/src/ggml-sycl/getrows.cpp +0 -311
  171. package/src/llama.cpp/ggml/src/ggml-sycl/getrows.hpp +0 -20
  172. package/src/llama.cpp/ggml/src/ggml-sycl/ggml-sycl.cpp +0 -4443
  173. package/src/llama.cpp/ggml/src/ggml-sycl/gla.cpp +0 -105
  174. package/src/llama.cpp/ggml/src/ggml-sycl/gla.hpp +0 -8
  175. package/src/llama.cpp/ggml/src/ggml-sycl/im2col.cpp +0 -136
  176. package/src/llama.cpp/ggml/src/ggml-sycl/im2col.hpp +0 -21
  177. package/src/llama.cpp/ggml/src/ggml-sycl/mmq.cpp +0 -3030
  178. package/src/llama.cpp/ggml/src/ggml-sycl/mmq.hpp +0 -33
  179. package/src/llama.cpp/ggml/src/ggml-sycl/mmvq.cpp +0 -1108
  180. package/src/llama.cpp/ggml/src/ggml-sycl/mmvq.hpp +0 -27
  181. package/src/llama.cpp/ggml/src/ggml-sycl/norm.cpp +0 -474
  182. package/src/llama.cpp/ggml/src/ggml-sycl/norm.hpp +0 -26
  183. package/src/llama.cpp/ggml/src/ggml-sycl/outprod.cpp +0 -46
  184. package/src/llama.cpp/ggml/src/ggml-sycl/outprod.hpp +0 -10
  185. package/src/llama.cpp/ggml/src/ggml-sycl/presets.hpp +0 -74
  186. package/src/llama.cpp/ggml/src/ggml-sycl/quants.hpp +0 -83
  187. package/src/llama.cpp/ggml/src/ggml-sycl/rope.cpp +0 -362
  188. package/src/llama.cpp/ggml/src/ggml-sycl/rope.hpp +0 -20
  189. package/src/llama.cpp/ggml/src/ggml-sycl/softmax.cpp +0 -264
  190. package/src/llama.cpp/ggml/src/ggml-sycl/softmax.hpp +0 -20
  191. package/src/llama.cpp/ggml/src/ggml-sycl/sycl_hw.cpp +0 -13
  192. package/src/llama.cpp/ggml/src/ggml-sycl/sycl_hw.hpp +0 -23
  193. package/src/llama.cpp/ggml/src/ggml-sycl/tsembd.cpp +0 -73
  194. package/src/llama.cpp/ggml/src/ggml-sycl/tsembd.hpp +0 -20
  195. package/src/llama.cpp/ggml/src/ggml-sycl/vecdotq.hpp +0 -1215
  196. package/src/llama.cpp/ggml/src/ggml-sycl/wkv.cpp +0 -305
  197. package/src/llama.cpp/ggml/src/ggml-sycl/wkv.hpp +0 -10
  198. package/src/llama.cpp/ggml/src/ggml-threading.cpp +0 -12
  199. package/src/llama.cpp/ggml/src/ggml-threading.h +0 -14
  200. package/src/llama.cpp/ggml/src/ggml-vulkan/CMakeLists.txt +0 -196
  201. package/src/llama.cpp/ggml/src/ggml-vulkan/ggml-vulkan.cpp +0 -10699
  202. package/src/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/CMakeLists.txt +0 -39
  203. package/src/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp +0 -751
  204. package/src/llama.cpp/ggml/src/ggml.c +0 -6550
  205. package/src/llama.cpp/ggml/src/gguf.cpp +0 -1330
  206. package/src/llama.cpp/models/.editorconfig +0 -1
  207. package/src/llama.cpp/models/ggml-vocab-aquila.gguf +0 -0
  208. package/src/llama.cpp/models/ggml-vocab-baichuan.gguf +0 -0
  209. package/src/llama.cpp/models/ggml-vocab-bert-bge.gguf +0 -0
  210. package/src/llama.cpp/models/ggml-vocab-bert-bge.gguf.inp +0 -112
  211. package/src/llama.cpp/models/ggml-vocab-bert-bge.gguf.out +0 -46
  212. package/src/llama.cpp/models/ggml-vocab-chameleon.gguf.inp +0 -112
  213. package/src/llama.cpp/models/ggml-vocab-chameleon.gguf.out +0 -46
  214. package/src/llama.cpp/models/ggml-vocab-command-r.gguf +0 -0
  215. package/src/llama.cpp/models/ggml-vocab-command-r.gguf.inp +0 -112
  216. package/src/llama.cpp/models/ggml-vocab-command-r.gguf.out +0 -46
  217. package/src/llama.cpp/models/ggml-vocab-deepseek-coder.gguf +0 -0
  218. package/src/llama.cpp/models/ggml-vocab-deepseek-coder.gguf.inp +0 -112
  219. package/src/llama.cpp/models/ggml-vocab-deepseek-coder.gguf.out +0 -46
  220. package/src/llama.cpp/models/ggml-vocab-deepseek-llm.gguf +0 -0
  221. package/src/llama.cpp/models/ggml-vocab-deepseek-llm.gguf.inp +0 -112
  222. package/src/llama.cpp/models/ggml-vocab-deepseek-llm.gguf.out +0 -46
  223. package/src/llama.cpp/models/ggml-vocab-deepseek-r1-qwen.gguf.inp +0 -112
  224. package/src/llama.cpp/models/ggml-vocab-deepseek-r1-qwen.gguf.out +0 -46
  225. package/src/llama.cpp/models/ggml-vocab-falcon.gguf +0 -0
  226. package/src/llama.cpp/models/ggml-vocab-falcon.gguf.inp +0 -112
  227. package/src/llama.cpp/models/ggml-vocab-falcon.gguf.out +0 -46
  228. package/src/llama.cpp/models/ggml-vocab-gpt-2.gguf +0 -0
  229. package/src/llama.cpp/models/ggml-vocab-gpt-2.gguf.inp +0 -112
  230. package/src/llama.cpp/models/ggml-vocab-gpt-2.gguf.out +0 -46
  231. package/src/llama.cpp/models/ggml-vocab-gpt-4o.gguf.inp +0 -112
  232. package/src/llama.cpp/models/ggml-vocab-gpt-4o.gguf.out +0 -46
  233. package/src/llama.cpp/models/ggml-vocab-gpt-neox.gguf +0 -0
  234. package/src/llama.cpp/models/ggml-vocab-llama-bpe.gguf +0 -0
  235. package/src/llama.cpp/models/ggml-vocab-llama-bpe.gguf.inp +0 -112
  236. package/src/llama.cpp/models/ggml-vocab-llama-bpe.gguf.out +0 -46
  237. package/src/llama.cpp/models/ggml-vocab-llama-spm.gguf +0 -0
  238. package/src/llama.cpp/models/ggml-vocab-llama-spm.gguf.inp +0 -112
  239. package/src/llama.cpp/models/ggml-vocab-llama-spm.gguf.out +0 -46
  240. package/src/llama.cpp/models/ggml-vocab-llama4.gguf.inp +0 -112
  241. package/src/llama.cpp/models/ggml-vocab-llama4.gguf.out +0 -46
  242. package/src/llama.cpp/models/ggml-vocab-mpt.gguf +0 -0
  243. package/src/llama.cpp/models/ggml-vocab-mpt.gguf.inp +0 -112
  244. package/src/llama.cpp/models/ggml-vocab-mpt.gguf.out +0 -46
  245. package/src/llama.cpp/models/ggml-vocab-phi-3.gguf +0 -0
  246. package/src/llama.cpp/models/ggml-vocab-phi-3.gguf.inp +0 -112
  247. package/src/llama.cpp/models/ggml-vocab-phi-3.gguf.out +0 -46
  248. package/src/llama.cpp/models/ggml-vocab-pixtral.gguf.inp +0 -112
  249. package/src/llama.cpp/models/ggml-vocab-pixtral.gguf.out +0 -46
  250. package/src/llama.cpp/models/ggml-vocab-qwen2.gguf +0 -0
  251. package/src/llama.cpp/models/ggml-vocab-qwen2.gguf.inp +0 -112
  252. package/src/llama.cpp/models/ggml-vocab-qwen2.gguf.out +0 -46
  253. package/src/llama.cpp/models/ggml-vocab-refact.gguf +0 -0
  254. package/src/llama.cpp/models/ggml-vocab-refact.gguf.inp +0 -112
  255. package/src/llama.cpp/models/ggml-vocab-refact.gguf.out +0 -46
  256. package/src/llama.cpp/models/ggml-vocab-roberta-bpe.gguf.inp +0 -112
  257. package/src/llama.cpp/models/ggml-vocab-roberta-bpe.gguf.out +0 -46
  258. package/src/llama.cpp/models/ggml-vocab-starcoder.gguf +0 -0
  259. package/src/llama.cpp/models/ggml-vocab-starcoder.gguf.inp +0 -112
  260. package/src/llama.cpp/models/ggml-vocab-starcoder.gguf.out +0 -46
  261. package/src/llama.cpp/pocs/CMakeLists.txt +0 -14
  262. package/src/llama.cpp/pocs/vdot/CMakeLists.txt +0 -9
  263. package/src/llama.cpp/pocs/vdot/q8dot.cpp +0 -173
  264. package/src/llama.cpp/pocs/vdot/vdot.cpp +0 -311
  265. package/src/llama.cpp/prompts/LLM-questions.txt +0 -49
  266. package/src/llama.cpp/prompts/alpaca.txt +0 -1
  267. package/src/llama.cpp/prompts/assistant.txt +0 -31
  268. package/src/llama.cpp/prompts/chat-with-baichuan.txt +0 -4
  269. package/src/llama.cpp/prompts/chat-with-bob.txt +0 -7
  270. package/src/llama.cpp/prompts/chat-with-qwen.txt +0 -1
  271. package/src/llama.cpp/prompts/chat-with-vicuna-v0.txt +0 -7
  272. package/src/llama.cpp/prompts/chat-with-vicuna-v1.txt +0 -7
  273. package/src/llama.cpp/prompts/chat.txt +0 -28
  274. package/src/llama.cpp/prompts/dan-modified.txt +0 -1
  275. package/src/llama.cpp/prompts/dan.txt +0 -1
  276. package/src/llama.cpp/prompts/mnemonics.txt +0 -93
  277. package/src/llama.cpp/prompts/parallel-questions.txt +0 -43
  278. package/src/llama.cpp/prompts/reason-act.txt +0 -18
  279. package/src/llama.cpp/requirements/requirements-all.txt +0 -15
  280. package/src/llama.cpp/requirements/requirements-compare-llama-bench.txt +0 -2
  281. package/src/llama.cpp/requirements/requirements-convert_hf_to_gguf.txt +0 -7
  282. package/src/llama.cpp/requirements/requirements-convert_hf_to_gguf_update.txt +0 -7
  283. package/src/llama.cpp/requirements/requirements-convert_legacy_llama.txt +0 -5
  284. package/src/llama.cpp/requirements/requirements-convert_llama_ggml_to_gguf.txt +0 -1
  285. package/src/llama.cpp/requirements/requirements-convert_lora_to_gguf.txt +0 -4
  286. package/src/llama.cpp/requirements/requirements-gguf_editor_gui.txt +0 -3
  287. package/src/llama.cpp/requirements/requirements-pydantic.txt +0 -3
  288. package/src/llama.cpp/requirements/requirements-test-tokenizer-random.txt +0 -1
  289. package/src/llama.cpp/requirements/requirements-tool_bench.txt +0 -12
  290. package/src/llama.cpp/requirements.txt +0 -13
  291. package/src/llama.cpp/scripts/build-info.sh +0 -30
  292. package/src/llama.cpp/scripts/install-oneapi.bat +0 -19
  293. package/src/llama.cpp/scripts/xxd.cmake +0 -16
  294. package/src/llama.cpp/tests/CMakeLists.txt +0 -177
  295. package/src/llama.cpp/tests/get-model.cpp +0 -21
  296. package/src/llama.cpp/tests/get-model.h +0 -2
  297. package/src/llama.cpp/tests/test-arg-parser.cpp +0 -178
  298. package/src/llama.cpp/tests/test-autorelease.cpp +0 -24
  299. package/src/llama.cpp/tests/test-backend-ops.cpp +0 -4793
  300. package/src/llama.cpp/tests/test-barrier.cpp +0 -94
  301. package/src/llama.cpp/tests/test-c.c +0 -7
  302. package/src/llama.cpp/tests/test-chat-template.cpp +0 -417
  303. package/src/llama.cpp/tests/test-chat.cpp +0 -985
  304. package/src/llama.cpp/tests/test-double-float.cpp +0 -57
  305. package/src/llama.cpp/tests/test-gbnf-validator.cpp +0 -109
  306. package/src/llama.cpp/tests/test-gguf.cpp +0 -1338
  307. package/src/llama.cpp/tests/test-grammar-integration.cpp +0 -1308
  308. package/src/llama.cpp/tests/test-grammar-llguidance.cpp +0 -1201
  309. package/src/llama.cpp/tests/test-grammar-parser.cpp +0 -519
  310. package/src/llama.cpp/tests/test-json-schema-to-grammar.cpp +0 -1304
  311. package/src/llama.cpp/tests/test-llama-grammar.cpp +0 -408
  312. package/src/llama.cpp/tests/test-log.cpp +0 -39
  313. package/src/llama.cpp/tests/test-model-load-cancel.cpp +0 -27
  314. package/src/llama.cpp/tests/test-mtmd-c-api.c +0 -63
  315. package/src/llama.cpp/tests/test-opt.cpp +0 -904
  316. package/src/llama.cpp/tests/test-quantize-fns.cpp +0 -186
  317. package/src/llama.cpp/tests/test-quantize-perf.cpp +0 -365
  318. package/src/llama.cpp/tests/test-quantize-stats.cpp +0 -424
  319. package/src/llama.cpp/tests/test-regex-partial.cpp +0 -288
  320. package/src/llama.cpp/tests/test-rope.cpp +0 -262
  321. package/src/llama.cpp/tests/test-sampling.cpp +0 -399
  322. package/src/llama.cpp/tests/test-tokenizer-0.cpp +0 -312
  323. package/src/llama.cpp/tests/test-tokenizer-1-bpe.cpp +0 -155
  324. package/src/llama.cpp/tests/test-tokenizer-1-spm.cpp +0 -125
  325. package/src/llama.cpp/tools/CMakeLists.txt +0 -39
  326. package/src/llama.cpp/tools/batched-bench/CMakeLists.txt +0 -5
  327. package/src/llama.cpp/tools/batched-bench/batched-bench.cpp +0 -204
  328. package/src/llama.cpp/tools/cvector-generator/CMakeLists.txt +0 -5
  329. package/src/llama.cpp/tools/cvector-generator/completions.txt +0 -582
  330. package/src/llama.cpp/tools/cvector-generator/cvector-generator.cpp +0 -508
  331. package/src/llama.cpp/tools/cvector-generator/mean.hpp +0 -48
  332. package/src/llama.cpp/tools/cvector-generator/negative.txt +0 -4
  333. package/src/llama.cpp/tools/cvector-generator/pca.hpp +0 -315
  334. package/src/llama.cpp/tools/cvector-generator/positive.txt +0 -4
  335. package/src/llama.cpp/tools/export-lora/CMakeLists.txt +0 -5
  336. package/src/llama.cpp/tools/export-lora/export-lora.cpp +0 -434
  337. package/src/llama.cpp/tools/gguf-split/CMakeLists.txt +0 -5
  338. package/src/llama.cpp/tools/gguf-split/gguf-split.cpp +0 -583
  339. package/src/llama.cpp/tools/imatrix/CMakeLists.txt +0 -5
  340. package/src/llama.cpp/tools/imatrix/imatrix.cpp +0 -667
  341. package/src/llama.cpp/tools/llama-bench/CMakeLists.txt +0 -5
  342. package/src/llama.cpp/tools/llama-bench/llama-bench.cpp +0 -2024
  343. package/src/llama.cpp/tools/main/CMakeLists.txt +0 -5
  344. package/src/llama.cpp/tools/main/main.cpp +0 -977
  345. package/src/llama.cpp/tools/mtmd/CMakeLists.txt +0 -58
  346. package/src/llama.cpp/tools/mtmd/clip-impl.h +0 -462
  347. package/src/llama.cpp/tools/mtmd/clip.cpp +0 -4024
  348. package/src/llama.cpp/tools/mtmd/clip.h +0 -101
  349. package/src/llama.cpp/tools/mtmd/deprecation-warning.cpp +0 -22
  350. package/src/llama.cpp/tools/mtmd/miniaudio.h +0 -93468
  351. package/src/llama.cpp/tools/mtmd/mtmd-audio.cpp +0 -855
  352. package/src/llama.cpp/tools/mtmd/mtmd-audio.h +0 -62
  353. package/src/llama.cpp/tools/mtmd/mtmd-cli.cpp +0 -377
  354. package/src/llama.cpp/tools/mtmd/mtmd-helper.cpp +0 -297
  355. package/src/llama.cpp/tools/mtmd/mtmd.cpp +0 -942
  356. package/src/llama.cpp/tools/mtmd/mtmd.h +0 -362
  357. package/src/llama.cpp/tools/mtmd/requirements.txt +0 -5
  358. package/src/llama.cpp/tools/perplexity/CMakeLists.txt +0 -5
  359. package/src/llama.cpp/tools/perplexity/perplexity.cpp +0 -2063
  360. package/src/llama.cpp/tools/quantize/CMakeLists.txt +0 -6
  361. package/src/llama.cpp/tools/quantize/quantize.cpp +0 -519
  362. package/src/llama.cpp/tools/rpc/CMakeLists.txt +0 -4
  363. package/src/llama.cpp/tools/rpc/rpc-server.cpp +0 -322
  364. package/src/llama.cpp/tools/run/CMakeLists.txt +0 -16
  365. package/src/llama.cpp/tools/run/linenoise.cpp/linenoise.cpp +0 -1995
  366. package/src/llama.cpp/tools/run/linenoise.cpp/linenoise.h +0 -137
  367. package/src/llama.cpp/tools/run/run.cpp +0 -1261
  368. package/src/llama.cpp/tools/server/CMakeLists.txt +0 -51
  369. package/src/llama.cpp/tools/server/bench/requirements.txt +0 -2
  370. package/src/llama.cpp/tools/server/httplib.h +0 -10506
  371. package/src/llama.cpp/tools/server/server.cpp +0 -4966
  372. package/src/llama.cpp/tools/server/tests/requirements.txt +0 -8
  373. package/src/llama.cpp/tools/server/utils.hpp +0 -1337
  374. package/src/llama.cpp/tools/tokenize/CMakeLists.txt +0 -5
  375. package/src/llama.cpp/tools/tokenize/tokenize.cpp +0 -416
  376. package/src/llama.cpp/tools/tts/CMakeLists.txt +0 -5
  377. package/src/llama.cpp/tools/tts/tts.cpp +0 -1092
@@ -1,112 +0,0 @@
1
- ied 4 ½ months
2
- __ggml_vocab_test__
3
- Führer
4
- __ggml_vocab_test__
5
-
6
- __ggml_vocab_test__
7
-
8
- __ggml_vocab_test__
9
-
10
- __ggml_vocab_test__
11
-
12
- __ggml_vocab_test__
13
-
14
- __ggml_vocab_test__
15
-
16
-
17
- __ggml_vocab_test__
18
-
19
-
20
-
21
- __ggml_vocab_test__
22
-
23
-
24
-
25
-
26
- __ggml_vocab_test__
27
-
28
-
29
- __ggml_vocab_test__
30
- Hello world
31
- __ggml_vocab_test__
32
- Hello world
33
- __ggml_vocab_test__
34
- Hello World
35
- __ggml_vocab_test__
36
- Hello World
37
- __ggml_vocab_test__
38
- Hello World!
39
- __ggml_vocab_test__
40
- Hello, world!
41
- __ggml_vocab_test__
42
- Hello, world!
43
- __ggml_vocab_test__
44
- this is 🦙.cpp
45
- __ggml_vocab_test__
46
- w048 7tuijk dsdfhu
47
- __ggml_vocab_test__
48
- нещо на Български
49
- __ggml_vocab_test__
50
- កាន់តែពិសេសអាចខលចេញ
51
- __ggml_vocab_test__
52
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ (only emoji that has its own token)
53
- __ggml_vocab_test__
54
- Hello
55
- __ggml_vocab_test__
56
- Hello
57
- __ggml_vocab_test__
58
- Hello
59
- __ggml_vocab_test__
60
- Hello
61
- __ggml_vocab_test__
62
- Hello
63
- __ggml_vocab_test__
64
- Hello
65
- Hello
66
- __ggml_vocab_test__
67
- (
68
- __ggml_vocab_test__
69
-
70
- =
71
- __ggml_vocab_test__
72
- ' era
73
- __ggml_vocab_test__
74
- Hello, y'all! How are you 😁 ?我想在apple工作1314151天~
75
- __ggml_vocab_test__
76
- !!!!!!
77
- __ggml_vocab_test__
78
- 3
79
- __ggml_vocab_test__
80
- 33
81
- __ggml_vocab_test__
82
- 333
83
- __ggml_vocab_test__
84
- 3333
85
- __ggml_vocab_test__
86
- 33333
87
- __ggml_vocab_test__
88
- 333333
89
- __ggml_vocab_test__
90
- 3333333
91
- __ggml_vocab_test__
92
- 33333333
93
- __ggml_vocab_test__
94
- 333333333
95
- __ggml_vocab_test__
96
- Cửa Việt
97
- __ggml_vocab_test__
98
- discards
99
- __ggml_vocab_test__
100
-
101
-
102
-
103
-
104
-
105
-
106
-
107
-
108
-
109
-
110
-
111
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ 🦙🦙 3 33 333 3333 33333 333333 3333333 33333333 3.3 3..3 3...3 កាន់តែពិសេសអាច😁 ?我想在apple工作1314151天~ ------======= нещо на Български ''''''```````""""......!!!!!!?????? I've been 'told he's there, 'RE you sure? 'M not sure I'll make it, 'D you like some tea? We'Ve a'lL
112
- __ggml_vocab_test__
@@ -1,46 +0,0 @@
1
- 4833 225 38 225 143 140 17723
2
- 56 2006 3935 265
3
-
4
- 225
5
- 261
6
- 264
7
- 202
8
- 203
9
- 478
10
- 2831
11
- 15773
12
- 8279 5788
13
- 12000 5788
14
- 8279 10896
15
- 12000 10896
16
- 12000 10896 19
17
- 8279 30 5788 19
18
- 12000 30 5788 19
19
- 458 438 5945 118 252 32 3766
20
- 105 34 38 42 225 41 102 1707 12530 10180 1479 8278
21
- 39862 8372 1039 9446 40242 13852 2053 8949 12531 1520 10700
22
- 14574 227 14574 133 14574 246 30457 238 14574 242 30457 229 14574 249 14574 134 14574 258 30457 228 14574 258 14574 114 14574 133 14574 232 14574 228 14574 254 14574 232 30457 228 14574 236
23
- 3807 253 227 308 4382 27 18458 133 46113 44967 123 13868 308 12565 19775 33071 40824 733 27 41889 308 2585 22680 688 1401 2819 4369 2404 27
24
- 8279
25
- 12000
26
- 225 12000
27
- 261 12000
28
- 264 12000
29
- 264 12000 284 12000
30
- 308
31
- 203 280
32
- 25 34666
33
- 8279 30 533 25 464 19 4971 884 844 18458 228 1018 4982 13368 2909 9513 17827 35 37 35 38 35 39 35 11873 47838
34
- 9163 3202
35
- 37
36
- 37 37
37
- 37 37 37
38
- 37 37 37 37
39
- 37 37 37 37 37
40
- 37 37 37 37 37 37
41
- 37 37 37 37 37 37 37
42
- 37 37 37 37 37 37 37 37
43
- 37 37 37 37 37 37 37 37 37
44
- 53 33934 83 33217 17102 102
45
- 1214 12258
46
- 334 719 8878 202 10885 4222 16104 28570 203 3807 253 227 308 4382 27 18458 133 46113 44967 123 13868 308 12565 19775 33071 40824 733 27 41889 5945 118 252 3807 118 252 225 37 225 37 37 225 37 37 37 225 37 37 37 37 225 37 37 37 37 37 225 37 37 37 37 37 37 225 37 37 37 37 37 37 37 225 37 37 37 37 37 37 37 37 225 37 32 37 225 37 497 37 225 37 1179 37 225 14574 227 14574 133 14574 246 30457 238 14574 242 30457 229 14574 249 14574 134 14574 258 30457 228 14574 258 14574 114 14574 133 14574 232 36628 228 1018 4982 13368 2909 9513 17827 35 37 35 38 35 39 35 11873 47838 20921 16623 13028 8372 1039 9446 40242 13852 2053 8949 12531 1520 10700 5881 9592 13299 914 31753 31359 9163 3202 35472 10397 439 4763 2583 330 102 1455 938 1182 2017 30 330 613 844 3654 49 330 63 646 3654 439 4621 1930 561 30 330 54 844 2124 1629 35993 49 2688 25 7709 312 25 94 62
@@ -1,112 +0,0 @@
1
- ied 4 ½ months
2
- __ggml_vocab_test__
3
- Führer
4
- __ggml_vocab_test__
5
-
6
- __ggml_vocab_test__
7
-
8
- __ggml_vocab_test__
9
-
10
- __ggml_vocab_test__
11
-
12
- __ggml_vocab_test__
13
-
14
- __ggml_vocab_test__
15
-
16
-
17
- __ggml_vocab_test__
18
-
19
-
20
-
21
- __ggml_vocab_test__
22
-
23
-
24
-
25
-
26
- __ggml_vocab_test__
27
-
28
-
29
- __ggml_vocab_test__
30
- Hello world
31
- __ggml_vocab_test__
32
- Hello world
33
- __ggml_vocab_test__
34
- Hello World
35
- __ggml_vocab_test__
36
- Hello World
37
- __ggml_vocab_test__
38
- Hello World!
39
- __ggml_vocab_test__
40
- Hello, world!
41
- __ggml_vocab_test__
42
- Hello, world!
43
- __ggml_vocab_test__
44
- this is 🦙.cpp
45
- __ggml_vocab_test__
46
- w048 7tuijk dsdfhu
47
- __ggml_vocab_test__
48
- нещо на Български
49
- __ggml_vocab_test__
50
- កាន់តែពិសេសអាចខលចេញ
51
- __ggml_vocab_test__
52
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ (only emoji that has its own token)
53
- __ggml_vocab_test__
54
- Hello
55
- __ggml_vocab_test__
56
- Hello
57
- __ggml_vocab_test__
58
- Hello
59
- __ggml_vocab_test__
60
- Hello
61
- __ggml_vocab_test__
62
- Hello
63
- __ggml_vocab_test__
64
- Hello
65
- Hello
66
- __ggml_vocab_test__
67
- (
68
- __ggml_vocab_test__
69
-
70
- =
71
- __ggml_vocab_test__
72
- ' era
73
- __ggml_vocab_test__
74
- Hello, y'all! How are you 😁 ?我想在apple工作1314151天~
75
- __ggml_vocab_test__
76
- !!!!!!
77
- __ggml_vocab_test__
78
- 3
79
- __ggml_vocab_test__
80
- 33
81
- __ggml_vocab_test__
82
- 333
83
- __ggml_vocab_test__
84
- 3333
85
- __ggml_vocab_test__
86
- 33333
87
- __ggml_vocab_test__
88
- 333333
89
- __ggml_vocab_test__
90
- 3333333
91
- __ggml_vocab_test__
92
- 33333333
93
- __ggml_vocab_test__
94
- 333333333
95
- __ggml_vocab_test__
96
- Cửa Việt
97
- __ggml_vocab_test__
98
- discards
99
- __ggml_vocab_test__
100
-
101
-
102
-
103
-
104
-
105
-
106
-
107
-
108
-
109
-
110
-
111
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ 🦙🦙 3 33 333 3333 33333 333333 3333333 33333333 3.3 3..3 3...3 កាន់តែពិសេសអាច😁 ?我想在apple工作1314151天~ ------======= нещо на Български ''''''```````""""......!!!!!!?????? I've been 'told he's there, 'RE you sure? 'M not sure I'll make it, 'D you like some tea? We'Ve a'lL
112
- __ggml_vocab_test__
@@ -1,46 +0,0 @@
1
- 2550 204 18430 377
2
- 597 2768 298 8564
3
-
4
- 1437
5
- 1437 1437
6
- 1437 1437 1437
7
- 50117
8
- 50118
9
- 50140
10
- 50140 50118
11
- 50117 50118
12
- 31414 232
13
- 20920 232
14
- 31414 623
15
- 20920 623
16
- 20920 623 328
17
- 31414 6 232 328
18
- 20920 6 232 328
19
- 42 16 8103 18164 27 4 49317
20
- 605 40976 262 10109 18474 385 29 36807 6455
21
- 36765 25482 22063 23171 34251 18697 10809 26161 18697 3602 22063 27969 40966 25417 15264 26161 24269 36709 41171 35328
22
- 1376 17772 7471 1376 17772 19002 1376 17772 9085 1376 4333 13859 1376 17772 9357 1376 4333 9264 1376 17772 25448 1376 17772 18400 1376 17772 4333 1376 4333 10172 1376 17772 4333 1376 17772 7258 1376 17772 19002 1376 17772 5782 1376 17772 10172 1376 17772 3726 1376 17772 5782 1376 4333 10172 1376 17772 23171
23
- 6569 15113 7471 36 21113 43 17841 19002 17 8384 6569 14285 4958 12605 36 34654 2841 4203 354 10146 26511 1070 43 36174 5782 36 8338 21554 14 34 63 308 19233 43
24
- 31414
25
- 20920
26
- 1437 20920
27
- 1437 1437 20920
28
- 1437 1437 1437 20920
29
- 1437 1437 1437 20920 50118 1437 1437 1437 20920
30
- 36
31
- 50118 5457
32
- 108 3567
33
- 31414 6 1423 108 1250 328 1336 32 47 17841 10172 17487 47876 3602 48617 15264 46537 11423 27326 48494 8210 49233 1558 1570 27761 49429 43251 10809 17772
34
- 32376 12846
35
- 246
36
- 3103
37
- 25631
38
- 46152
39
- 3103 25631
40
- 46152 3103
41
- 46152 25631
42
- 46152 46152
43
- 46152 3103 25631
44
- 347 1376 2023 12410 102 16376 1376 2023 6382 90
45
- 9553 5954
46
- 50118 1437 50140 1437 50140 50118 1437 50117 1437 50117 50117 1437 50117 50118 1437 1437 50118 1437 1437 1437 50118 1437 1437 1437 1437 50118 1437 1437 1437 1437 1437 50118 6569 15113 7471 36 21113 43 17841 19002 17 8384 6569 14285 4958 12605 36 34654 2841 4203 354 10146 26511 1070 43 36174 5782 8103 18164 27 6569 18164 27 155 2357 30242 155 25631 30242 3103 30242 25631 30242 46152 30242 3103 25631 155 4 246 155 7586 246 155 734 246 25974 17772 7471 1376 17772 19002 1376 17772 9085 1376 4333 13859 1376 17772 9357 1376 4333 9264 1376 17772 25448 1376 17772 18400 1376 17772 4333 1376 4333 10172 1376 17772 4333 1376 17772 7258 1376 17772 19002 1376 17772 5782 18636 10172 17487 47876 3602 48617 15264 46537 11423 27326 48494 8210 49233 1558 1570 27761 49429 43251 10809 17772 36738 48332 47463 18697 10809 25482 22063 23171 34251 18697 10809 26161 18697 3602 22063 27969 40966 25417 15264 26161 24269 36709 41171 35328 128 49690 108 49972 49519 12905 48149 48149 43796 32376 12846 27282 28749 38 348 57 128 41042 37 18 89 6 128 4629 47 686 116 128 448 45 686 38 581 146 24 6 128 495 47 101 103 6845 116 166 108 30660 10 108 462 574
@@ -1,112 +0,0 @@
1
- ied 4 ½ months
2
- __ggml_vocab_test__
3
- Führer
4
- __ggml_vocab_test__
5
-
6
- __ggml_vocab_test__
7
-
8
- __ggml_vocab_test__
9
-
10
- __ggml_vocab_test__
11
-
12
- __ggml_vocab_test__
13
-
14
- __ggml_vocab_test__
15
-
16
-
17
- __ggml_vocab_test__
18
-
19
-
20
-
21
- __ggml_vocab_test__
22
-
23
-
24
-
25
-
26
- __ggml_vocab_test__
27
-
28
-
29
- __ggml_vocab_test__
30
- Hello world
31
- __ggml_vocab_test__
32
- Hello world
33
- __ggml_vocab_test__
34
- Hello World
35
- __ggml_vocab_test__
36
- Hello World
37
- __ggml_vocab_test__
38
- Hello World!
39
- __ggml_vocab_test__
40
- Hello, world!
41
- __ggml_vocab_test__
42
- Hello, world!
43
- __ggml_vocab_test__
44
- this is 🦙.cpp
45
- __ggml_vocab_test__
46
- w048 7tuijk dsdfhu
47
- __ggml_vocab_test__
48
- нещо на Български
49
- __ggml_vocab_test__
50
- កាន់តែពិសេសអាចខលចេញ
51
- __ggml_vocab_test__
52
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ (only emoji that has its own token)
53
- __ggml_vocab_test__
54
- Hello
55
- __ggml_vocab_test__
56
- Hello
57
- __ggml_vocab_test__
58
- Hello
59
- __ggml_vocab_test__
60
- Hello
61
- __ggml_vocab_test__
62
- Hello
63
- __ggml_vocab_test__
64
- Hello
65
- Hello
66
- __ggml_vocab_test__
67
- (
68
- __ggml_vocab_test__
69
-
70
- =
71
- __ggml_vocab_test__
72
- ' era
73
- __ggml_vocab_test__
74
- Hello, y'all! How are you 😁 ?我想在apple工作1314151天~
75
- __ggml_vocab_test__
76
- !!!!!!
77
- __ggml_vocab_test__
78
- 3
79
- __ggml_vocab_test__
80
- 33
81
- __ggml_vocab_test__
82
- 333
83
- __ggml_vocab_test__
84
- 3333
85
- __ggml_vocab_test__
86
- 33333
87
- __ggml_vocab_test__
88
- 333333
89
- __ggml_vocab_test__
90
- 3333333
91
- __ggml_vocab_test__
92
- 33333333
93
- __ggml_vocab_test__
94
- 333333333
95
- __ggml_vocab_test__
96
- Cửa Việt
97
- __ggml_vocab_test__
98
- discards
99
- __ggml_vocab_test__
100
-
101
-
102
-
103
-
104
-
105
-
106
-
107
-
108
-
109
-
110
-
111
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ 🦙🦙 3 33 333 3333 33333 333333 3333333 33333333 3.3 3..3 3...3 កាន់តែពិសេសអាច😁 ?我想在apple工作1314151天~ ------======= нещо на Български ''''''```````""""......!!!!!!?????? I've been 'told he's there, 'RE you sure? 'M not sure I'll make it, 'D you like some tea? We'Ve a'lL
112
- __ggml_vocab_test__
@@ -1,46 +0,0 @@
1
- 4850 244 57 244 162 159 17722
2
- 75 2022 3943 284
3
-
4
- 244
5
- 280
6
- 283
7
- 221
8
- 222
9
- 499
10
- 3067
11
- 15767
12
- 8302 5810
13
- 12009 5810
14
- 8302 10914
15
- 12009 10914
16
- 12009 10914 38
17
- 8302 49 5810 38
18
- 12009 49 5810 38
19
- 477 458 5954 137 271 51 3779
20
- 124 53 57 61 244 60 121 1726 12568 10240 1519 8290
21
- 39916 8389 1059 9504 40216 13858 2073 8983 12571 1539 10721
22
- 14566 246 14566 152 14566 265 30428 257 14566 261 30428 248 14566 268 14566 153 14566 277 30428 247 14566 277 14566 133 14566 152 14566 251 14566 247 14566 273 14566 251 30428 247 14566 255
23
- 3822 272 246 327 4434 46 18445 152 46030 45022 142 13878 327 12585 19884 33773 40920 751 46 41839 327 2605 22716 708 1421 2840 4387 2421 46
24
- 8302
25
- 12009
26
- 244 12009
27
- 280 12009
28
- 283 12009
29
- 283 12009 303 12009
30
- 327
31
- 222 299
32
- 44 34719
33
- 8302 49 553 44 483 38 4998 904 863 18445 247 1037 4995 13379 2924 9515 17823 54 56 54 57 54 58 54 11904 47892
34
- 9221 3226
35
- 56
36
- 56 56
37
- 56 56 56
38
- 56 56 56 56
39
- 56 56 56 56 56
40
- 56 56 56 56 56 56
41
- 56 56 56 56 56 56 56
42
- 56 56 56 56 56 56 56 56
43
- 56 56 56 56 56 56 56 56 56
44
- 72 34269 102 33245 17234 121
45
- 1236 12266
46
- 353 736 8886 221 10883 4238 16101 28540 222 3822 272 246 327 4434 46 18445 152 46030 45022 142 13878 327 12585 19884 33773 40920 751 46 41839 5954 137 271 3822 137 271 244 56 244 56 56 244 56 56 56 244 56 56 56 56 244 56 56 56 56 56 244 56 56 56 56 56 56 244 56 56 56 56 56 56 56 244 56 56 56 56 56 56 56 56 244 56 51 56 244 56 516 56 244 56 1198 56 244 14566 246 14566 152 14566 265 30428 257 14566 261 30428 248 14566 268 14566 153 14566 277 30428 247 14566 277 14566 133 14566 152 14566 251 36570 247 1037 4995 13379 2924 9515 17823 54 56 54 57 54 58 54 11904 47892 20895 16625 13047 8389 1059 9504 40216 13858 2073 8983 12571 1539 10721 5918 9643 13298 932 31723 31330 9221 3226 35426 10400 457 4783 2602 349 121 1477 957 1200 2038 49 349 632 863 3673 68 349 82 666 3673 457 4650 1949 580 49 349 73 863 2144 1649 35941 68 2726 44 7728 331 44 113 81
@@ -1,14 +0,0 @@
1
- # dependencies
2
-
3
- find_package(Threads REQUIRED)
4
-
5
- # third-party
6
-
7
- include_directories(${CMAKE_CURRENT_SOURCE_DIR})
8
-
9
- if (EMSCRIPTEN)
10
- else()
11
- if (NOT GGML_BACKEND_DL)
12
- add_subdirectory(vdot)
13
- endif()
14
- endif()
@@ -1,9 +0,0 @@
1
- set(TARGET llama-vdot)
2
- add_executable(${TARGET} vdot.cpp)
3
- target_link_libraries(${TARGET} PRIVATE common llama ${CMAKE_THREAD_LIBS_INIT})
4
- target_compile_features(${TARGET} PRIVATE cxx_std_17)
5
-
6
- set(TARGET llama-q8dot)
7
- add_executable(${TARGET} q8dot.cpp)
8
- target_link_libraries(${TARGET} PRIVATE common llama ${CMAKE_THREAD_LIBS_INIT})
9
- target_compile_features(${TARGET} PRIVATE cxx_std_17)
@@ -1,173 +0,0 @@
1
- #include <cstdio>
2
- #include <type_traits>
3
- #include <vector>
4
- #include <random>
5
- #include <chrono>
6
- #include <cstdlib>
7
- #include <cmath>
8
- #include <cassert>
9
- #include <cstring>
10
- #include <array>
11
- #include <type_traits>
12
-
13
- #include <ggml.h>
14
- #include <ggml-cpu.h>
15
-
16
- constexpr int kVecSize = 1 << 16;
17
-
18
- // Copy-pasted from ggml.c
19
- #define QK4_0 32
20
- typedef struct {
21
- float d; // delta
22
- uint8_t qs[QK4_0 / 2]; // nibbles / quants
23
- } block_q4_0;
24
- static_assert(sizeof(block_q4_0) == sizeof(float) + QK4_0 / 2, "wrong q4_0 block size/padding");
25
-
26
- #define QK4_1 32
27
- typedef struct {
28
- float d; // delta
29
- float m; // min
30
- uint8_t qs[QK4_1 / 2]; // nibbles / quants
31
- } block_q4_1;
32
- static_assert(sizeof(block_q4_1) == sizeof(float) * 2 + QK4_1 / 2, "wrong q4_1 block size/padding");
33
-
34
- // Copy-pasted from ggml.c
35
- #define QK8_0 32
36
- typedef struct {
37
- float d; // delta
38
- float s; // d * sum(qs[i])
39
- int8_t qs[QK8_0]; // quants
40
- } block_q8_0;
41
- static_assert(sizeof(block_q8_0) == 2*sizeof(float) + QK8_0, "wrong q8_0 block size/padding");
42
-
43
- static_assert(QK4_1 == QK8_0, "QK4_1 and QK8_0 must be the same");
44
- static_assert(QK4_0 == QK8_0, "QK4_0 and QK8_0 must be the same");
45
-
46
- template <typename T>
47
- static void fillQ4blocks(std::vector<T>& blocks, std::mt19937& rndm) {
48
- for (auto& b : blocks) {
49
- b.d = 1;
50
- for (int i=0; i<QK4_1/2; ++i) {
51
- uint8_t v1 = rndm() >> 28;
52
- uint8_t v2 = rndm() >> 28;
53
- b.qs[i] = v1 | (v2 << 4);
54
- }
55
- }
56
- }
57
-
58
- static void fillQ80blocks(std::vector<block_q8_0>& blocks, std::mt19937& rndm) {
59
- for (auto& b : blocks) {
60
- b.d = 1;
61
- int sum = 0;
62
- for (int i=0; i<QK8_0; ++i) {
63
- b.qs[i] = (rndm() >> 24) - 128;
64
- sum += b.qs[i];
65
- }
66
- b.s = b.d * sum;
67
- }
68
- }
69
-
70
- static float simpleDot(const block_q4_0& x, const block_q8_0& y) {
71
- int s1 = 0; //, s2 = 0;
72
- for (int i=0; i<QK4_1/2; i+=2) {
73
- int v1 = x.qs[i+0] & 0xf;
74
- int v2 = x.qs[i+0] >> 4;
75
- int v3 = x.qs[i+1] & 0xf;
76
- int v4 = x.qs[i+1] >> 4;
77
- int j = 2*i;
78
- s1 += v1*y.qs[j] + v2*y.qs[j+1] + v3*y.qs[j+2] + v4*y.qs[j+3];
79
- //s2 += y.qs[j] + y.qs[j+1] + y.qs[j+2] + y.qs[j+3];
80
- }
81
- return y.d * x.d * s1 - 8 * x.d * y.s;
82
- //return y.d * x.d * (s1 - 8 * s2);
83
- }
84
-
85
- static float simpleDot(const block_q4_1& x, const block_q8_0& y) {
86
- int s1 = 0; //, s2 = 0;
87
- for (int i=0; i<QK4_1/2; i+=2) {
88
- int v1 = x.qs[i+0] & 0xf;
89
- int v2 = x.qs[i+0] >> 4;
90
- int v3 = x.qs[i+1] & 0xf;
91
- int v4 = x.qs[i+1] >> 4;
92
- int j = 2*i;
93
- s1 += v1*y.qs[j] + v2*y.qs[j+1] + v3*y.qs[j+2] + v4*y.qs[j+3];
94
- //s2 += y.qs[j] + y.qs[j+1] + y.qs[j+2] + y.qs[j+3];
95
- }
96
- return y.d * x.d * s1 + y.s * x.m;
97
- //return y.d * (x.d * s1 + x.m * s2);
98
- }
99
-
100
- struct Stat {
101
- double sum = 0, sumt = 0, sumt2 = 0, maxt = 0;
102
- int nloop = 0;
103
- void addResult(double s, double t) {
104
- sum += s;
105
- sumt += t; sumt2 += t*t; maxt = std::max(maxt, t);
106
- ++nloop;
107
- }
108
- void reportResult(const char* title) const {
109
- if (nloop < 1) {
110
- printf("%s(%s): no result\n",__func__,title);
111
- return;
112
- }
113
- printf("============ %s\n",title);
114
- printf("<dot> = %g\n",sum/nloop);
115
- auto t = sumt/nloop, dt = sumt2/nloop - t*t;
116
- if (dt > 0) dt = sqrt(dt);
117
- printf("<time> = %g +/- %g us. Max. time = %g us.\n",t,dt,maxt);
118
- }
119
- };
120
-
121
-
122
- int main(int argc, char** argv) {
123
-
124
- int nloop = argc > 1 ? atoi(argv[1]) : 10;
125
- int type = argc > 2 ? atoi(argv[2]) : 1;
126
-
127
- std::mt19937 rndm(1234);
128
-
129
- std::vector<block_q4_1> x41;
130
- std::vector<block_q4_0> x40;
131
- std::vector<block_q8_0> y(kVecSize);
132
- if (type == 0) x40.resize(kVecSize);
133
- else {
134
- x41.resize(kVecSize);
135
- for (auto& b : x41) b.m = 1;
136
- }
137
-
138
- auto ggml_type = type == 0 ? GGML_TYPE_Q4_0 : GGML_TYPE_Q4_1;
139
-
140
- const auto * funcs = ggml_get_type_traits_cpu(ggml_type);
141
-
142
- Stat simple, ggml;
143
-
144
- for (int iloop=0; iloop<nloop; ++iloop) {
145
-
146
- if (type == 0) fillQ4blocks(x40, rndm);
147
- else fillQ4blocks(x41, rndm);
148
- fillQ80blocks(y, rndm);
149
-
150
- auto t1 = std::chrono::high_resolution_clock::now();
151
- double s = 0;
152
- if (type == 0) for (int i=0; i<kVecSize; ++i) s += simpleDot(x40[i], y[i]);
153
- else for (int i=0; i<kVecSize; ++i) s += simpleDot(x41[i], y[i]);
154
- auto t2 = std::chrono::high_resolution_clock::now();
155
- auto t = 1e-3*std::chrono::duration_cast<std::chrono::nanoseconds>(t2-t1).count();
156
- if (iloop > 3) simple.addResult(s, t);
157
-
158
- t1 = std::chrono::high_resolution_clock::now();
159
- float fs;
160
- if (type == 0) funcs->vec_dot(kVecSize * QK4_1, &fs, 0, x40.data(), 0, y.data(), 0, 1);
161
- else funcs->vec_dot(kVecSize * QK4_1, &fs, 0, x41.data(), 0, y.data(), 0, 1);
162
- t2 = std::chrono::high_resolution_clock::now();
163
- t = 1e-3*std::chrono::duration_cast<std::chrono::nanoseconds>(t2-t1).count();
164
- if (iloop > 3) ggml.addResult(fs, t);
165
-
166
- }
167
-
168
- // Report the time (and the average of the dot products so the compiler does not come up with the idea
169
- // of optimizing away the function calls after figuring that the result is not used).
170
- simple.reportResult("Simple");
171
- ggml.reportResult("ggml");
172
- return 0;
173
- }