@fugood/llama.node 0.6.2 → 1.0.0-beta.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (378) hide show
  1. package/CMakeLists.txt +40 -30
  2. package/README.md +4 -1
  3. package/lib/binding.js +41 -29
  4. package/lib/binding.ts +26 -25
  5. package/package.json +45 -10
  6. package/scripts/build.js +47 -0
  7. package/scripts/llama.cpp.patch +109 -0
  8. package/src/anyascii.c +22223 -0
  9. package/src/anyascii.h +42 -0
  10. package/src/tts_utils.cpp +20 -7
  11. package/src/tts_utils.h +2 -0
  12. package/bin/darwin/arm64/llama-node.node +0 -0
  13. package/bin/darwin/x64/llama-node.node +0 -0
  14. package/bin/linux/arm64/llama-node.node +0 -0
  15. package/bin/linux/x64/llama-node.node +0 -0
  16. package/bin/linux-cuda/arm64/llama-node.node +0 -0
  17. package/bin/linux-cuda/x64/llama-node.node +0 -0
  18. package/bin/linux-vulkan/arm64/llama-node.node +0 -0
  19. package/bin/linux-vulkan/x64/llama-node.node +0 -0
  20. package/bin/win32/x64/llama-node.node +0 -0
  21. package/bin/win32/x64/node.lib +0 -0
  22. package/bin/win32-vulkan/arm64/llama-node.node +0 -0
  23. package/bin/win32-vulkan/arm64/node.lib +0 -0
  24. package/bin/win32-vulkan/x64/llama-node.node +0 -0
  25. package/bin/win32-vulkan/x64/node.lib +0 -0
  26. package/patches/node-api-headers+1.1.0.patch +0 -26
  27. package/src/llama.cpp/.github/workflows/build-linux-cross.yml +0 -233
  28. package/src/llama.cpp/.github/workflows/build.yml +0 -1078
  29. package/src/llama.cpp/.github/workflows/close-issue.yml +0 -28
  30. package/src/llama.cpp/.github/workflows/docker.yml +0 -178
  31. package/src/llama.cpp/.github/workflows/editorconfig.yml +0 -29
  32. package/src/llama.cpp/.github/workflows/gguf-publish.yml +0 -44
  33. package/src/llama.cpp/.github/workflows/labeler.yml +0 -17
  34. package/src/llama.cpp/.github/workflows/python-check-requirements.yml +0 -33
  35. package/src/llama.cpp/.github/workflows/python-lint.yml +0 -30
  36. package/src/llama.cpp/.github/workflows/python-type-check.yml +0 -40
  37. package/src/llama.cpp/.github/workflows/release.yml +0 -739
  38. package/src/llama.cpp/.github/workflows/server.yml +0 -237
  39. package/src/llama.cpp/.github/workflows/winget.yml +0 -42
  40. package/src/llama.cpp/cmake/arm64-apple-clang.cmake +0 -16
  41. package/src/llama.cpp/cmake/arm64-windows-llvm.cmake +0 -16
  42. package/src/llama.cpp/cmake/build-info.cmake +0 -64
  43. package/src/llama.cpp/cmake/common.cmake +0 -35
  44. package/src/llama.cpp/cmake/git-vars.cmake +0 -22
  45. package/src/llama.cpp/cmake/x64-windows-llvm.cmake +0 -5
  46. package/src/llama.cpp/common/build-info.cpp.in +0 -4
  47. package/src/llama.cpp/docs/build.md +0 -561
  48. package/src/llama.cpp/examples/CMakeLists.txt +0 -43
  49. package/src/llama.cpp/examples/batched/CMakeLists.txt +0 -5
  50. package/src/llama.cpp/examples/batched/batched.cpp +0 -246
  51. package/src/llama.cpp/examples/chat-13B.bat +0 -57
  52. package/src/llama.cpp/examples/convert-llama2c-to-ggml/CMakeLists.txt +0 -5
  53. package/src/llama.cpp/examples/convert-llama2c-to-ggml/convert-llama2c-to-ggml.cpp +0 -941
  54. package/src/llama.cpp/examples/deprecation-warning/deprecation-warning.cpp +0 -35
  55. package/src/llama.cpp/examples/embedding/CMakeLists.txt +0 -5
  56. package/src/llama.cpp/examples/embedding/embedding.cpp +0 -323
  57. package/src/llama.cpp/examples/eval-callback/CMakeLists.txt +0 -10
  58. package/src/llama.cpp/examples/eval-callback/eval-callback.cpp +0 -194
  59. package/src/llama.cpp/examples/gen-docs/CMakeLists.txt +0 -5
  60. package/src/llama.cpp/examples/gen-docs/gen-docs.cpp +0 -83
  61. package/src/llama.cpp/examples/gguf/CMakeLists.txt +0 -5
  62. package/src/llama.cpp/examples/gguf/gguf.cpp +0 -265
  63. package/src/llama.cpp/examples/gguf-hash/CMakeLists.txt +0 -22
  64. package/src/llama.cpp/examples/gguf-hash/deps/rotate-bits/rotate-bits.h +0 -46
  65. package/src/llama.cpp/examples/gguf-hash/deps/sha1/sha1.c +0 -295
  66. package/src/llama.cpp/examples/gguf-hash/deps/sha1/sha1.h +0 -52
  67. package/src/llama.cpp/examples/gguf-hash/deps/sha256/sha256.c +0 -221
  68. package/src/llama.cpp/examples/gguf-hash/deps/sha256/sha256.h +0 -24
  69. package/src/llama.cpp/examples/gguf-hash/deps/xxhash/xxhash.c +0 -42
  70. package/src/llama.cpp/examples/gguf-hash/deps/xxhash/xxhash.h +0 -7093
  71. package/src/llama.cpp/examples/gguf-hash/gguf-hash.cpp +0 -694
  72. package/src/llama.cpp/examples/gritlm/CMakeLists.txt +0 -5
  73. package/src/llama.cpp/examples/gritlm/gritlm.cpp +0 -229
  74. package/src/llama.cpp/examples/jeopardy/questions.txt +0 -100
  75. package/src/llama.cpp/examples/llama.android/app/build.gradle.kts +0 -65
  76. package/src/llama.cpp/examples/llama.android/build.gradle.kts +0 -6
  77. package/src/llama.cpp/examples/llama.android/llama/build.gradle.kts +0 -71
  78. package/src/llama.cpp/examples/llama.android/llama/src/main/cpp/CMakeLists.txt +0 -53
  79. package/src/llama.cpp/examples/llama.android/llama/src/main/cpp/llama-android.cpp +0 -452
  80. package/src/llama.cpp/examples/llama.android/settings.gradle.kts +0 -18
  81. package/src/llama.cpp/examples/lookahead/CMakeLists.txt +0 -5
  82. package/src/llama.cpp/examples/lookahead/lookahead.cpp +0 -472
  83. package/src/llama.cpp/examples/lookup/CMakeLists.txt +0 -23
  84. package/src/llama.cpp/examples/lookup/lookup-create.cpp +0 -40
  85. package/src/llama.cpp/examples/lookup/lookup-merge.cpp +0 -47
  86. package/src/llama.cpp/examples/lookup/lookup-stats.cpp +0 -157
  87. package/src/llama.cpp/examples/lookup/lookup.cpp +0 -242
  88. package/src/llama.cpp/examples/parallel/CMakeLists.txt +0 -5
  89. package/src/llama.cpp/examples/parallel/parallel.cpp +0 -492
  90. package/src/llama.cpp/examples/passkey/CMakeLists.txt +0 -5
  91. package/src/llama.cpp/examples/passkey/passkey.cpp +0 -277
  92. package/src/llama.cpp/examples/retrieval/CMakeLists.txt +0 -5
  93. package/src/llama.cpp/examples/retrieval/retrieval.cpp +0 -304
  94. package/src/llama.cpp/examples/save-load-state/CMakeLists.txt +0 -5
  95. package/src/llama.cpp/examples/save-load-state/save-load-state.cpp +0 -246
  96. package/src/llama.cpp/examples/simple/CMakeLists.txt +0 -5
  97. package/src/llama.cpp/examples/simple/simple.cpp +0 -206
  98. package/src/llama.cpp/examples/simple-chat/CMakeLists.txt +0 -5
  99. package/src/llama.cpp/examples/simple-chat/simple-chat.cpp +0 -206
  100. package/src/llama.cpp/examples/simple-cmake-pkg/CMakeLists.txt +0 -11
  101. package/src/llama.cpp/examples/speculative/CMakeLists.txt +0 -5
  102. package/src/llama.cpp/examples/speculative/speculative.cpp +0 -644
  103. package/src/llama.cpp/examples/speculative-simple/CMakeLists.txt +0 -5
  104. package/src/llama.cpp/examples/speculative-simple/speculative-simple.cpp +0 -261
  105. package/src/llama.cpp/examples/sycl/CMakeLists.txt +0 -9
  106. package/src/llama.cpp/examples/sycl/build.sh +0 -23
  107. package/src/llama.cpp/examples/sycl/ls-sycl-device.cpp +0 -13
  108. package/src/llama.cpp/examples/sycl/run-llama2.sh +0 -27
  109. package/src/llama.cpp/examples/sycl/run-llama3.sh +0 -28
  110. package/src/llama.cpp/examples/sycl/win-build-sycl.bat +0 -33
  111. package/src/llama.cpp/examples/sycl/win-run-llama2.bat +0 -9
  112. package/src/llama.cpp/examples/sycl/win-run-llama3.bat +0 -9
  113. package/src/llama.cpp/examples/training/CMakeLists.txt +0 -5
  114. package/src/llama.cpp/examples/training/finetune.cpp +0 -96
  115. package/src/llama.cpp/ggml/cmake/GitVars.cmake +0 -22
  116. package/src/llama.cpp/ggml/cmake/common.cmake +0 -26
  117. package/src/llama.cpp/ggml/src/ggml-alloc.c +0 -1042
  118. package/src/llama.cpp/ggml/src/ggml-backend-impl.h +0 -255
  119. package/src/llama.cpp/ggml/src/ggml-backend-reg.cpp +0 -586
  120. package/src/llama.cpp/ggml/src/ggml-backend.cpp +0 -2008
  121. package/src/llama.cpp/ggml/src/ggml-blas/CMakeLists.txt +0 -87
  122. package/src/llama.cpp/ggml/src/ggml-blas/ggml-blas.cpp +0 -517
  123. package/src/llama.cpp/ggml/src/ggml-cann/CMakeLists.txt +0 -74
  124. package/src/llama.cpp/ggml/src/ggml-cann/acl_tensor.cpp +0 -179
  125. package/src/llama.cpp/ggml/src/ggml-cann/acl_tensor.h +0 -258
  126. package/src/llama.cpp/ggml/src/ggml-cann/aclnn_ops.cpp +0 -2863
  127. package/src/llama.cpp/ggml/src/ggml-cann/aclnn_ops.h +0 -1110
  128. package/src/llama.cpp/ggml/src/ggml-cann/common.h +0 -420
  129. package/src/llama.cpp/ggml/src/ggml-cann/ggml-cann.cpp +0 -2570
  130. package/src/llama.cpp/ggml/src/ggml-common.h +0 -1857
  131. package/src/llama.cpp/ggml/src/ggml-cpu/cmake/FindSIMD.cmake +0 -100
  132. package/src/llama.cpp/ggml/src/ggml-cuda/CMakeLists.txt +0 -184
  133. package/src/llama.cpp/ggml/src/ggml-cuda/vendors/cuda.h +0 -15
  134. package/src/llama.cpp/ggml/src/ggml-cuda/vendors/hip.h +0 -243
  135. package/src/llama.cpp/ggml/src/ggml-cuda/vendors/musa.h +0 -140
  136. package/src/llama.cpp/ggml/src/ggml-hip/CMakeLists.txt +0 -131
  137. package/src/llama.cpp/ggml/src/ggml-impl.h +0 -601
  138. package/src/llama.cpp/ggml/src/ggml-kompute/CMakeLists.txt +0 -166
  139. package/src/llama.cpp/ggml/src/ggml-kompute/ggml-kompute.cpp +0 -2251
  140. package/src/llama.cpp/ggml/src/ggml-metal/CMakeLists.txt +0 -120
  141. package/src/llama.cpp/ggml/src/ggml-metal/ggml-metal-impl.h +0 -622
  142. package/src/llama.cpp/ggml/src/ggml-musa/CMakeLists.txt +0 -113
  143. package/src/llama.cpp/ggml/src/ggml-opencl/CMakeLists.txt +0 -96
  144. package/src/llama.cpp/ggml/src/ggml-opencl/ggml-opencl.cpp +0 -5124
  145. package/src/llama.cpp/ggml/src/ggml-opt.cpp +0 -1037
  146. package/src/llama.cpp/ggml/src/ggml-quants.c +0 -5232
  147. package/src/llama.cpp/ggml/src/ggml-quants.h +0 -100
  148. package/src/llama.cpp/ggml/src/ggml-rpc/CMakeLists.txt +0 -9
  149. package/src/llama.cpp/ggml/src/ggml-rpc/ggml-rpc.cpp +0 -1813
  150. package/src/llama.cpp/ggml/src/ggml-sycl/CMakeLists.txt +0 -189
  151. package/src/llama.cpp/ggml/src/ggml-sycl/backend.hpp +0 -37
  152. package/src/llama.cpp/ggml/src/ggml-sycl/binbcast.cpp +0 -239
  153. package/src/llama.cpp/ggml/src/ggml-sycl/binbcast.hpp +0 -39
  154. package/src/llama.cpp/ggml/src/ggml-sycl/common.cpp +0 -83
  155. package/src/llama.cpp/ggml/src/ggml-sycl/common.hpp +0 -493
  156. package/src/llama.cpp/ggml/src/ggml-sycl/concat.cpp +0 -197
  157. package/src/llama.cpp/ggml/src/ggml-sycl/concat.hpp +0 -20
  158. package/src/llama.cpp/ggml/src/ggml-sycl/conv.cpp +0 -100
  159. package/src/llama.cpp/ggml/src/ggml-sycl/conv.hpp +0 -20
  160. package/src/llama.cpp/ggml/src/ggml-sycl/convert.cpp +0 -623
  161. package/src/llama.cpp/ggml/src/ggml-sycl/convert.hpp +0 -34
  162. package/src/llama.cpp/ggml/src/ggml-sycl/cpy.cpp +0 -701
  163. package/src/llama.cpp/ggml/src/ggml-sycl/cpy.hpp +0 -11
  164. package/src/llama.cpp/ggml/src/ggml-sycl/dequantize.hpp +0 -791
  165. package/src/llama.cpp/ggml/src/ggml-sycl/dmmv.cpp +0 -1160
  166. package/src/llama.cpp/ggml/src/ggml-sycl/dmmv.hpp +0 -27
  167. package/src/llama.cpp/ggml/src/ggml-sycl/dpct/helper.hpp +0 -2957
  168. package/src/llama.cpp/ggml/src/ggml-sycl/element_wise.cpp +0 -1536
  169. package/src/llama.cpp/ggml/src/ggml-sycl/element_wise.hpp +0 -75
  170. package/src/llama.cpp/ggml/src/ggml-sycl/gemm.hpp +0 -99
  171. package/src/llama.cpp/ggml/src/ggml-sycl/getrows.cpp +0 -311
  172. package/src/llama.cpp/ggml/src/ggml-sycl/getrows.hpp +0 -20
  173. package/src/llama.cpp/ggml/src/ggml-sycl/ggml-sycl.cpp +0 -4443
  174. package/src/llama.cpp/ggml/src/ggml-sycl/gla.cpp +0 -105
  175. package/src/llama.cpp/ggml/src/ggml-sycl/gla.hpp +0 -8
  176. package/src/llama.cpp/ggml/src/ggml-sycl/im2col.cpp +0 -136
  177. package/src/llama.cpp/ggml/src/ggml-sycl/im2col.hpp +0 -21
  178. package/src/llama.cpp/ggml/src/ggml-sycl/mmq.cpp +0 -3030
  179. package/src/llama.cpp/ggml/src/ggml-sycl/mmq.hpp +0 -33
  180. package/src/llama.cpp/ggml/src/ggml-sycl/mmvq.cpp +0 -1108
  181. package/src/llama.cpp/ggml/src/ggml-sycl/mmvq.hpp +0 -27
  182. package/src/llama.cpp/ggml/src/ggml-sycl/norm.cpp +0 -474
  183. package/src/llama.cpp/ggml/src/ggml-sycl/norm.hpp +0 -26
  184. package/src/llama.cpp/ggml/src/ggml-sycl/outprod.cpp +0 -46
  185. package/src/llama.cpp/ggml/src/ggml-sycl/outprod.hpp +0 -10
  186. package/src/llama.cpp/ggml/src/ggml-sycl/presets.hpp +0 -74
  187. package/src/llama.cpp/ggml/src/ggml-sycl/quants.hpp +0 -83
  188. package/src/llama.cpp/ggml/src/ggml-sycl/rope.cpp +0 -362
  189. package/src/llama.cpp/ggml/src/ggml-sycl/rope.hpp +0 -20
  190. package/src/llama.cpp/ggml/src/ggml-sycl/softmax.cpp +0 -264
  191. package/src/llama.cpp/ggml/src/ggml-sycl/softmax.hpp +0 -20
  192. package/src/llama.cpp/ggml/src/ggml-sycl/sycl_hw.cpp +0 -13
  193. package/src/llama.cpp/ggml/src/ggml-sycl/sycl_hw.hpp +0 -23
  194. package/src/llama.cpp/ggml/src/ggml-sycl/tsembd.cpp +0 -73
  195. package/src/llama.cpp/ggml/src/ggml-sycl/tsembd.hpp +0 -20
  196. package/src/llama.cpp/ggml/src/ggml-sycl/vecdotq.hpp +0 -1215
  197. package/src/llama.cpp/ggml/src/ggml-sycl/wkv.cpp +0 -305
  198. package/src/llama.cpp/ggml/src/ggml-sycl/wkv.hpp +0 -10
  199. package/src/llama.cpp/ggml/src/ggml-threading.cpp +0 -12
  200. package/src/llama.cpp/ggml/src/ggml-threading.h +0 -14
  201. package/src/llama.cpp/ggml/src/ggml-vulkan/CMakeLists.txt +0 -196
  202. package/src/llama.cpp/ggml/src/ggml-vulkan/ggml-vulkan.cpp +0 -10699
  203. package/src/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/CMakeLists.txt +0 -39
  204. package/src/llama.cpp/ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp +0 -751
  205. package/src/llama.cpp/ggml/src/ggml.c +0 -6550
  206. package/src/llama.cpp/ggml/src/gguf.cpp +0 -1330
  207. package/src/llama.cpp/models/.editorconfig +0 -1
  208. package/src/llama.cpp/models/ggml-vocab-aquila.gguf +0 -0
  209. package/src/llama.cpp/models/ggml-vocab-baichuan.gguf +0 -0
  210. package/src/llama.cpp/models/ggml-vocab-bert-bge.gguf +0 -0
  211. package/src/llama.cpp/models/ggml-vocab-bert-bge.gguf.inp +0 -112
  212. package/src/llama.cpp/models/ggml-vocab-bert-bge.gguf.out +0 -46
  213. package/src/llama.cpp/models/ggml-vocab-chameleon.gguf.inp +0 -112
  214. package/src/llama.cpp/models/ggml-vocab-chameleon.gguf.out +0 -46
  215. package/src/llama.cpp/models/ggml-vocab-command-r.gguf +0 -0
  216. package/src/llama.cpp/models/ggml-vocab-command-r.gguf.inp +0 -112
  217. package/src/llama.cpp/models/ggml-vocab-command-r.gguf.out +0 -46
  218. package/src/llama.cpp/models/ggml-vocab-deepseek-coder.gguf +0 -0
  219. package/src/llama.cpp/models/ggml-vocab-deepseek-coder.gguf.inp +0 -112
  220. package/src/llama.cpp/models/ggml-vocab-deepseek-coder.gguf.out +0 -46
  221. package/src/llama.cpp/models/ggml-vocab-deepseek-llm.gguf +0 -0
  222. package/src/llama.cpp/models/ggml-vocab-deepseek-llm.gguf.inp +0 -112
  223. package/src/llama.cpp/models/ggml-vocab-deepseek-llm.gguf.out +0 -46
  224. package/src/llama.cpp/models/ggml-vocab-deepseek-r1-qwen.gguf.inp +0 -112
  225. package/src/llama.cpp/models/ggml-vocab-deepseek-r1-qwen.gguf.out +0 -46
  226. package/src/llama.cpp/models/ggml-vocab-falcon.gguf +0 -0
  227. package/src/llama.cpp/models/ggml-vocab-falcon.gguf.inp +0 -112
  228. package/src/llama.cpp/models/ggml-vocab-falcon.gguf.out +0 -46
  229. package/src/llama.cpp/models/ggml-vocab-gpt-2.gguf +0 -0
  230. package/src/llama.cpp/models/ggml-vocab-gpt-2.gguf.inp +0 -112
  231. package/src/llama.cpp/models/ggml-vocab-gpt-2.gguf.out +0 -46
  232. package/src/llama.cpp/models/ggml-vocab-gpt-4o.gguf.inp +0 -112
  233. package/src/llama.cpp/models/ggml-vocab-gpt-4o.gguf.out +0 -46
  234. package/src/llama.cpp/models/ggml-vocab-gpt-neox.gguf +0 -0
  235. package/src/llama.cpp/models/ggml-vocab-llama-bpe.gguf +0 -0
  236. package/src/llama.cpp/models/ggml-vocab-llama-bpe.gguf.inp +0 -112
  237. package/src/llama.cpp/models/ggml-vocab-llama-bpe.gguf.out +0 -46
  238. package/src/llama.cpp/models/ggml-vocab-llama-spm.gguf +0 -0
  239. package/src/llama.cpp/models/ggml-vocab-llama-spm.gguf.inp +0 -112
  240. package/src/llama.cpp/models/ggml-vocab-llama-spm.gguf.out +0 -46
  241. package/src/llama.cpp/models/ggml-vocab-llama4.gguf.inp +0 -112
  242. package/src/llama.cpp/models/ggml-vocab-llama4.gguf.out +0 -46
  243. package/src/llama.cpp/models/ggml-vocab-mpt.gguf +0 -0
  244. package/src/llama.cpp/models/ggml-vocab-mpt.gguf.inp +0 -112
  245. package/src/llama.cpp/models/ggml-vocab-mpt.gguf.out +0 -46
  246. package/src/llama.cpp/models/ggml-vocab-phi-3.gguf +0 -0
  247. package/src/llama.cpp/models/ggml-vocab-phi-3.gguf.inp +0 -112
  248. package/src/llama.cpp/models/ggml-vocab-phi-3.gguf.out +0 -46
  249. package/src/llama.cpp/models/ggml-vocab-pixtral.gguf.inp +0 -112
  250. package/src/llama.cpp/models/ggml-vocab-pixtral.gguf.out +0 -46
  251. package/src/llama.cpp/models/ggml-vocab-qwen2.gguf +0 -0
  252. package/src/llama.cpp/models/ggml-vocab-qwen2.gguf.inp +0 -112
  253. package/src/llama.cpp/models/ggml-vocab-qwen2.gguf.out +0 -46
  254. package/src/llama.cpp/models/ggml-vocab-refact.gguf +0 -0
  255. package/src/llama.cpp/models/ggml-vocab-refact.gguf.inp +0 -112
  256. package/src/llama.cpp/models/ggml-vocab-refact.gguf.out +0 -46
  257. package/src/llama.cpp/models/ggml-vocab-roberta-bpe.gguf.inp +0 -112
  258. package/src/llama.cpp/models/ggml-vocab-roberta-bpe.gguf.out +0 -46
  259. package/src/llama.cpp/models/ggml-vocab-starcoder.gguf +0 -0
  260. package/src/llama.cpp/models/ggml-vocab-starcoder.gguf.inp +0 -112
  261. package/src/llama.cpp/models/ggml-vocab-starcoder.gguf.out +0 -46
  262. package/src/llama.cpp/pocs/CMakeLists.txt +0 -14
  263. package/src/llama.cpp/pocs/vdot/CMakeLists.txt +0 -9
  264. package/src/llama.cpp/pocs/vdot/q8dot.cpp +0 -173
  265. package/src/llama.cpp/pocs/vdot/vdot.cpp +0 -311
  266. package/src/llama.cpp/prompts/LLM-questions.txt +0 -49
  267. package/src/llama.cpp/prompts/alpaca.txt +0 -1
  268. package/src/llama.cpp/prompts/assistant.txt +0 -31
  269. package/src/llama.cpp/prompts/chat-with-baichuan.txt +0 -4
  270. package/src/llama.cpp/prompts/chat-with-bob.txt +0 -7
  271. package/src/llama.cpp/prompts/chat-with-qwen.txt +0 -1
  272. package/src/llama.cpp/prompts/chat-with-vicuna-v0.txt +0 -7
  273. package/src/llama.cpp/prompts/chat-with-vicuna-v1.txt +0 -7
  274. package/src/llama.cpp/prompts/chat.txt +0 -28
  275. package/src/llama.cpp/prompts/dan-modified.txt +0 -1
  276. package/src/llama.cpp/prompts/dan.txt +0 -1
  277. package/src/llama.cpp/prompts/mnemonics.txt +0 -93
  278. package/src/llama.cpp/prompts/parallel-questions.txt +0 -43
  279. package/src/llama.cpp/prompts/reason-act.txt +0 -18
  280. package/src/llama.cpp/requirements/requirements-all.txt +0 -15
  281. package/src/llama.cpp/requirements/requirements-compare-llama-bench.txt +0 -2
  282. package/src/llama.cpp/requirements/requirements-convert_hf_to_gguf.txt +0 -7
  283. package/src/llama.cpp/requirements/requirements-convert_hf_to_gguf_update.txt +0 -7
  284. package/src/llama.cpp/requirements/requirements-convert_legacy_llama.txt +0 -5
  285. package/src/llama.cpp/requirements/requirements-convert_llama_ggml_to_gguf.txt +0 -1
  286. package/src/llama.cpp/requirements/requirements-convert_lora_to_gguf.txt +0 -4
  287. package/src/llama.cpp/requirements/requirements-gguf_editor_gui.txt +0 -3
  288. package/src/llama.cpp/requirements/requirements-pydantic.txt +0 -3
  289. package/src/llama.cpp/requirements/requirements-test-tokenizer-random.txt +0 -1
  290. package/src/llama.cpp/requirements/requirements-tool_bench.txt +0 -12
  291. package/src/llama.cpp/requirements.txt +0 -13
  292. package/src/llama.cpp/scripts/build-info.sh +0 -30
  293. package/src/llama.cpp/scripts/install-oneapi.bat +0 -19
  294. package/src/llama.cpp/scripts/xxd.cmake +0 -16
  295. package/src/llama.cpp/tests/CMakeLists.txt +0 -177
  296. package/src/llama.cpp/tests/get-model.cpp +0 -21
  297. package/src/llama.cpp/tests/get-model.h +0 -2
  298. package/src/llama.cpp/tests/test-arg-parser.cpp +0 -178
  299. package/src/llama.cpp/tests/test-autorelease.cpp +0 -24
  300. package/src/llama.cpp/tests/test-backend-ops.cpp +0 -4793
  301. package/src/llama.cpp/tests/test-barrier.cpp +0 -94
  302. package/src/llama.cpp/tests/test-c.c +0 -7
  303. package/src/llama.cpp/tests/test-chat-template.cpp +0 -417
  304. package/src/llama.cpp/tests/test-chat.cpp +0 -985
  305. package/src/llama.cpp/tests/test-double-float.cpp +0 -57
  306. package/src/llama.cpp/tests/test-gbnf-validator.cpp +0 -109
  307. package/src/llama.cpp/tests/test-gguf.cpp +0 -1338
  308. package/src/llama.cpp/tests/test-grammar-integration.cpp +0 -1308
  309. package/src/llama.cpp/tests/test-grammar-llguidance.cpp +0 -1201
  310. package/src/llama.cpp/tests/test-grammar-parser.cpp +0 -519
  311. package/src/llama.cpp/tests/test-json-schema-to-grammar.cpp +0 -1304
  312. package/src/llama.cpp/tests/test-llama-grammar.cpp +0 -408
  313. package/src/llama.cpp/tests/test-log.cpp +0 -39
  314. package/src/llama.cpp/tests/test-model-load-cancel.cpp +0 -27
  315. package/src/llama.cpp/tests/test-mtmd-c-api.c +0 -63
  316. package/src/llama.cpp/tests/test-opt.cpp +0 -904
  317. package/src/llama.cpp/tests/test-quantize-fns.cpp +0 -186
  318. package/src/llama.cpp/tests/test-quantize-perf.cpp +0 -365
  319. package/src/llama.cpp/tests/test-quantize-stats.cpp +0 -424
  320. package/src/llama.cpp/tests/test-regex-partial.cpp +0 -288
  321. package/src/llama.cpp/tests/test-rope.cpp +0 -262
  322. package/src/llama.cpp/tests/test-sampling.cpp +0 -399
  323. package/src/llama.cpp/tests/test-tokenizer-0.cpp +0 -312
  324. package/src/llama.cpp/tests/test-tokenizer-1-bpe.cpp +0 -155
  325. package/src/llama.cpp/tests/test-tokenizer-1-spm.cpp +0 -125
  326. package/src/llama.cpp/tools/CMakeLists.txt +0 -39
  327. package/src/llama.cpp/tools/batched-bench/CMakeLists.txt +0 -5
  328. package/src/llama.cpp/tools/batched-bench/batched-bench.cpp +0 -204
  329. package/src/llama.cpp/tools/cvector-generator/CMakeLists.txt +0 -5
  330. package/src/llama.cpp/tools/cvector-generator/completions.txt +0 -582
  331. package/src/llama.cpp/tools/cvector-generator/cvector-generator.cpp +0 -508
  332. package/src/llama.cpp/tools/cvector-generator/mean.hpp +0 -48
  333. package/src/llama.cpp/tools/cvector-generator/negative.txt +0 -4
  334. package/src/llama.cpp/tools/cvector-generator/pca.hpp +0 -315
  335. package/src/llama.cpp/tools/cvector-generator/positive.txt +0 -4
  336. package/src/llama.cpp/tools/export-lora/CMakeLists.txt +0 -5
  337. package/src/llama.cpp/tools/export-lora/export-lora.cpp +0 -434
  338. package/src/llama.cpp/tools/gguf-split/CMakeLists.txt +0 -5
  339. package/src/llama.cpp/tools/gguf-split/gguf-split.cpp +0 -583
  340. package/src/llama.cpp/tools/imatrix/CMakeLists.txt +0 -5
  341. package/src/llama.cpp/tools/imatrix/imatrix.cpp +0 -667
  342. package/src/llama.cpp/tools/llama-bench/CMakeLists.txt +0 -5
  343. package/src/llama.cpp/tools/llama-bench/llama-bench.cpp +0 -2024
  344. package/src/llama.cpp/tools/main/CMakeLists.txt +0 -5
  345. package/src/llama.cpp/tools/main/main.cpp +0 -977
  346. package/src/llama.cpp/tools/mtmd/CMakeLists.txt +0 -58
  347. package/src/llama.cpp/tools/mtmd/clip-impl.h +0 -462
  348. package/src/llama.cpp/tools/mtmd/clip.cpp +0 -4024
  349. package/src/llama.cpp/tools/mtmd/clip.h +0 -101
  350. package/src/llama.cpp/tools/mtmd/deprecation-warning.cpp +0 -22
  351. package/src/llama.cpp/tools/mtmd/miniaudio.h +0 -93468
  352. package/src/llama.cpp/tools/mtmd/mtmd-audio.cpp +0 -855
  353. package/src/llama.cpp/tools/mtmd/mtmd-audio.h +0 -62
  354. package/src/llama.cpp/tools/mtmd/mtmd-cli.cpp +0 -377
  355. package/src/llama.cpp/tools/mtmd/mtmd-helper.cpp +0 -297
  356. package/src/llama.cpp/tools/mtmd/mtmd.cpp +0 -942
  357. package/src/llama.cpp/tools/mtmd/mtmd.h +0 -362
  358. package/src/llama.cpp/tools/mtmd/requirements.txt +0 -5
  359. package/src/llama.cpp/tools/perplexity/CMakeLists.txt +0 -5
  360. package/src/llama.cpp/tools/perplexity/perplexity.cpp +0 -2063
  361. package/src/llama.cpp/tools/quantize/CMakeLists.txt +0 -6
  362. package/src/llama.cpp/tools/quantize/quantize.cpp +0 -519
  363. package/src/llama.cpp/tools/rpc/CMakeLists.txt +0 -4
  364. package/src/llama.cpp/tools/rpc/rpc-server.cpp +0 -322
  365. package/src/llama.cpp/tools/run/CMakeLists.txt +0 -16
  366. package/src/llama.cpp/tools/run/linenoise.cpp/linenoise.cpp +0 -1995
  367. package/src/llama.cpp/tools/run/linenoise.cpp/linenoise.h +0 -137
  368. package/src/llama.cpp/tools/run/run.cpp +0 -1261
  369. package/src/llama.cpp/tools/server/CMakeLists.txt +0 -51
  370. package/src/llama.cpp/tools/server/bench/requirements.txt +0 -2
  371. package/src/llama.cpp/tools/server/httplib.h +0 -10506
  372. package/src/llama.cpp/tools/server/server.cpp +0 -4966
  373. package/src/llama.cpp/tools/server/tests/requirements.txt +0 -8
  374. package/src/llama.cpp/tools/server/utils.hpp +0 -1337
  375. package/src/llama.cpp/tools/tokenize/CMakeLists.txt +0 -5
  376. package/src/llama.cpp/tools/tokenize/tokenize.cpp +0 -416
  377. package/src/llama.cpp/tools/tts/CMakeLists.txt +0 -5
  378. package/src/llama.cpp/tools/tts/tts.cpp +0 -1092
@@ -1,112 +0,0 @@
1
- ied 4 ½ months
2
- __ggml_vocab_test__
3
- Führer
4
- __ggml_vocab_test__
5
-
6
- __ggml_vocab_test__
7
-
8
- __ggml_vocab_test__
9
-
10
- __ggml_vocab_test__
11
-
12
- __ggml_vocab_test__
13
-
14
- __ggml_vocab_test__
15
-
16
-
17
- __ggml_vocab_test__
18
-
19
-
20
-
21
- __ggml_vocab_test__
22
-
23
-
24
-
25
-
26
- __ggml_vocab_test__
27
-
28
-
29
- __ggml_vocab_test__
30
- Hello world
31
- __ggml_vocab_test__
32
- Hello world
33
- __ggml_vocab_test__
34
- Hello World
35
- __ggml_vocab_test__
36
- Hello World
37
- __ggml_vocab_test__
38
- Hello World!
39
- __ggml_vocab_test__
40
- Hello, world!
41
- __ggml_vocab_test__
42
- Hello, world!
43
- __ggml_vocab_test__
44
- this is 🦙.cpp
45
- __ggml_vocab_test__
46
- w048 7tuijk dsdfhu
47
- __ggml_vocab_test__
48
- нещо на Български
49
- __ggml_vocab_test__
50
- កាន់តែពិសេសអាចខលចេញ
51
- __ggml_vocab_test__
52
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ (only emoji that has its own token)
53
- __ggml_vocab_test__
54
- Hello
55
- __ggml_vocab_test__
56
- Hello
57
- __ggml_vocab_test__
58
- Hello
59
- __ggml_vocab_test__
60
- Hello
61
- __ggml_vocab_test__
62
- Hello
63
- __ggml_vocab_test__
64
- Hello
65
- Hello
66
- __ggml_vocab_test__
67
- (
68
- __ggml_vocab_test__
69
-
70
- =
71
- __ggml_vocab_test__
72
- ' era
73
- __ggml_vocab_test__
74
- Hello, y'all! How are you 😁 ?我想在apple工作1314151天~
75
- __ggml_vocab_test__
76
- !!!!!!
77
- __ggml_vocab_test__
78
- 3
79
- __ggml_vocab_test__
80
- 33
81
- __ggml_vocab_test__
82
- 333
83
- __ggml_vocab_test__
84
- 3333
85
- __ggml_vocab_test__
86
- 33333
87
- __ggml_vocab_test__
88
- 333333
89
- __ggml_vocab_test__
90
- 3333333
91
- __ggml_vocab_test__
92
- 33333333
93
- __ggml_vocab_test__
94
- 333333333
95
- __ggml_vocab_test__
96
- Cửa Việt
97
- __ggml_vocab_test__
98
- discards
99
- __ggml_vocab_test__
100
-
101
-
102
-
103
-
104
-
105
-
106
-
107
-
108
-
109
-
110
-
111
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ 🦙🦙 3 33 333 3333 33333 333333 3333333 33333333 3.3 3..3 3...3 កាន់តែពិសេសអាច😁 ?我想在apple工作1314151天~ ------======= нещо на Български ''''''```````""""......!!!!!!?????? I've been 'told he's there, 'RE you sure? 'M not sure I'll make it, 'D you like some tea? We'Ve a'lL
112
- __ggml_vocab_test__
@@ -1,46 +0,0 @@
1
- 4833 225 38 225 143 140 17723
2
- 56 2006 3935 265
3
-
4
- 225
5
- 261
6
- 264
7
- 202
8
- 203
9
- 478
10
- 2831
11
- 15773
12
- 8279 5788
13
- 12000 5788
14
- 8279 10896
15
- 12000 10896
16
- 12000 10896 19
17
- 8279 30 5788 19
18
- 12000 30 5788 19
19
- 458 438 5945 118 252 32 3766
20
- 105 34 38 42 225 41 102 1707 12530 10180 1479 8278
21
- 39862 8372 1039 9446 40242 13852 2053 8949 12531 1520 10700
22
- 14574 227 14574 133 14574 246 30457 238 14574 242 30457 229 14574 249 14574 134 14574 258 30457 228 14574 258 14574 114 14574 133 14574 232 14574 228 14574 254 14574 232 30457 228 14574 236
23
- 3807 253 227 308 4382 27 18458 133 46113 44967 123 13868 308 12565 19775 33071 40824 733 27 41889 308 2585 22680 688 1401 2819 4369 2404 27
24
- 8279
25
- 12000
26
- 225 12000
27
- 261 12000
28
- 264 12000
29
- 264 12000 284 12000
30
- 308
31
- 203 280
32
- 25 34666
33
- 8279 30 533 25 464 19 4971 884 844 18458 228 1018 4982 13368 2909 9513 17827 35 37 35 38 35 39 35 11873 47838
34
- 9163 3202
35
- 37
36
- 37 37
37
- 37 37 37
38
- 37 37 37 37
39
- 37 37 37 37 37
40
- 37 37 37 37 37 37
41
- 37 37 37 37 37 37 37
42
- 37 37 37 37 37 37 37 37
43
- 37 37 37 37 37 37 37 37 37
44
- 53 33934 83 33217 17102 102
45
- 1214 12258
46
- 334 719 8878 202 10885 4222 16104 28570 203 3807 253 227 308 4382 27 18458 133 46113 44967 123 13868 308 12565 19775 33071 40824 733 27 41889 5945 118 252 3807 118 252 225 37 225 37 37 225 37 37 37 225 37 37 37 37 225 37 37 37 37 37 225 37 37 37 37 37 37 225 37 37 37 37 37 37 37 225 37 37 37 37 37 37 37 37 225 37 32 37 225 37 497 37 225 37 1179 37 225 14574 227 14574 133 14574 246 30457 238 14574 242 30457 229 14574 249 14574 134 14574 258 30457 228 14574 258 14574 114 14574 133 14574 232 36628 228 1018 4982 13368 2909 9513 17827 35 37 35 38 35 39 35 11873 47838 20921 16623 13028 8372 1039 9446 40242 13852 2053 8949 12531 1520 10700 5881 9592 13299 914 31753 31359 9163 3202 35472 10397 439 4763 2583 330 102 1455 938 1182 2017 30 330 613 844 3654 49 330 63 646 3654 439 4621 1930 561 30 330 54 844 2124 1629 35993 49 2688 25 7709 312 25 94 62
@@ -1,112 +0,0 @@
1
- ied 4 ½ months
2
- __ggml_vocab_test__
3
- Führer
4
- __ggml_vocab_test__
5
-
6
- __ggml_vocab_test__
7
-
8
- __ggml_vocab_test__
9
-
10
- __ggml_vocab_test__
11
-
12
- __ggml_vocab_test__
13
-
14
- __ggml_vocab_test__
15
-
16
-
17
- __ggml_vocab_test__
18
-
19
-
20
-
21
- __ggml_vocab_test__
22
-
23
-
24
-
25
-
26
- __ggml_vocab_test__
27
-
28
-
29
- __ggml_vocab_test__
30
- Hello world
31
- __ggml_vocab_test__
32
- Hello world
33
- __ggml_vocab_test__
34
- Hello World
35
- __ggml_vocab_test__
36
- Hello World
37
- __ggml_vocab_test__
38
- Hello World!
39
- __ggml_vocab_test__
40
- Hello, world!
41
- __ggml_vocab_test__
42
- Hello, world!
43
- __ggml_vocab_test__
44
- this is 🦙.cpp
45
- __ggml_vocab_test__
46
- w048 7tuijk dsdfhu
47
- __ggml_vocab_test__
48
- нещо на Български
49
- __ggml_vocab_test__
50
- កាន់តែពិសេសអាចខលចេញ
51
- __ggml_vocab_test__
52
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ (only emoji that has its own token)
53
- __ggml_vocab_test__
54
- Hello
55
- __ggml_vocab_test__
56
- Hello
57
- __ggml_vocab_test__
58
- Hello
59
- __ggml_vocab_test__
60
- Hello
61
- __ggml_vocab_test__
62
- Hello
63
- __ggml_vocab_test__
64
- Hello
65
- Hello
66
- __ggml_vocab_test__
67
- (
68
- __ggml_vocab_test__
69
-
70
- =
71
- __ggml_vocab_test__
72
- ' era
73
- __ggml_vocab_test__
74
- Hello, y'all! How are you 😁 ?我想在apple工作1314151天~
75
- __ggml_vocab_test__
76
- !!!!!!
77
- __ggml_vocab_test__
78
- 3
79
- __ggml_vocab_test__
80
- 33
81
- __ggml_vocab_test__
82
- 333
83
- __ggml_vocab_test__
84
- 3333
85
- __ggml_vocab_test__
86
- 33333
87
- __ggml_vocab_test__
88
- 333333
89
- __ggml_vocab_test__
90
- 3333333
91
- __ggml_vocab_test__
92
- 33333333
93
- __ggml_vocab_test__
94
- 333333333
95
- __ggml_vocab_test__
96
- Cửa Việt
97
- __ggml_vocab_test__
98
- discards
99
- __ggml_vocab_test__
100
-
101
-
102
-
103
-
104
-
105
-
106
-
107
-
108
-
109
-
110
-
111
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ 🦙🦙 3 33 333 3333 33333 333333 3333333 33333333 3.3 3..3 3...3 កាន់តែពិសេសអាច😁 ?我想在apple工作1314151天~ ------======= нещо на Български ''''''```````""""......!!!!!!?????? I've been 'told he's there, 'RE you sure? 'M not sure I'll make it, 'D you like some tea? We'Ve a'lL
112
- __ggml_vocab_test__
@@ -1,46 +0,0 @@
1
- 2550 204 18430 377
2
- 597 2768 298 8564
3
-
4
- 1437
5
- 1437 1437
6
- 1437 1437 1437
7
- 50117
8
- 50118
9
- 50140
10
- 50140 50118
11
- 50117 50118
12
- 31414 232
13
- 20920 232
14
- 31414 623
15
- 20920 623
16
- 20920 623 328
17
- 31414 6 232 328
18
- 20920 6 232 328
19
- 42 16 8103 18164 27 4 49317
20
- 605 40976 262 10109 18474 385 29 36807 6455
21
- 36765 25482 22063 23171 34251 18697 10809 26161 18697 3602 22063 27969 40966 25417 15264 26161 24269 36709 41171 35328
22
- 1376 17772 7471 1376 17772 19002 1376 17772 9085 1376 4333 13859 1376 17772 9357 1376 4333 9264 1376 17772 25448 1376 17772 18400 1376 17772 4333 1376 4333 10172 1376 17772 4333 1376 17772 7258 1376 17772 19002 1376 17772 5782 1376 17772 10172 1376 17772 3726 1376 17772 5782 1376 4333 10172 1376 17772 23171
23
- 6569 15113 7471 36 21113 43 17841 19002 17 8384 6569 14285 4958 12605 36 34654 2841 4203 354 10146 26511 1070 43 36174 5782 36 8338 21554 14 34 63 308 19233 43
24
- 31414
25
- 20920
26
- 1437 20920
27
- 1437 1437 20920
28
- 1437 1437 1437 20920
29
- 1437 1437 1437 20920 50118 1437 1437 1437 20920
30
- 36
31
- 50118 5457
32
- 108 3567
33
- 31414 6 1423 108 1250 328 1336 32 47 17841 10172 17487 47876 3602 48617 15264 46537 11423 27326 48494 8210 49233 1558 1570 27761 49429 43251 10809 17772
34
- 32376 12846
35
- 246
36
- 3103
37
- 25631
38
- 46152
39
- 3103 25631
40
- 46152 3103
41
- 46152 25631
42
- 46152 46152
43
- 46152 3103 25631
44
- 347 1376 2023 12410 102 16376 1376 2023 6382 90
45
- 9553 5954
46
- 50118 1437 50140 1437 50140 50118 1437 50117 1437 50117 50117 1437 50117 50118 1437 1437 50118 1437 1437 1437 50118 1437 1437 1437 1437 50118 1437 1437 1437 1437 1437 50118 6569 15113 7471 36 21113 43 17841 19002 17 8384 6569 14285 4958 12605 36 34654 2841 4203 354 10146 26511 1070 43 36174 5782 8103 18164 27 6569 18164 27 155 2357 30242 155 25631 30242 3103 30242 25631 30242 46152 30242 3103 25631 155 4 246 155 7586 246 155 734 246 25974 17772 7471 1376 17772 19002 1376 17772 9085 1376 4333 13859 1376 17772 9357 1376 4333 9264 1376 17772 25448 1376 17772 18400 1376 17772 4333 1376 4333 10172 1376 17772 4333 1376 17772 7258 1376 17772 19002 1376 17772 5782 18636 10172 17487 47876 3602 48617 15264 46537 11423 27326 48494 8210 49233 1558 1570 27761 49429 43251 10809 17772 36738 48332 47463 18697 10809 25482 22063 23171 34251 18697 10809 26161 18697 3602 22063 27969 40966 25417 15264 26161 24269 36709 41171 35328 128 49690 108 49972 49519 12905 48149 48149 43796 32376 12846 27282 28749 38 348 57 128 41042 37 18 89 6 128 4629 47 686 116 128 448 45 686 38 581 146 24 6 128 495 47 101 103 6845 116 166 108 30660 10 108 462 574
@@ -1,112 +0,0 @@
1
- ied 4 ½ months
2
- __ggml_vocab_test__
3
- Führer
4
- __ggml_vocab_test__
5
-
6
- __ggml_vocab_test__
7
-
8
- __ggml_vocab_test__
9
-
10
- __ggml_vocab_test__
11
-
12
- __ggml_vocab_test__
13
-
14
- __ggml_vocab_test__
15
-
16
-
17
- __ggml_vocab_test__
18
-
19
-
20
-
21
- __ggml_vocab_test__
22
-
23
-
24
-
25
-
26
- __ggml_vocab_test__
27
-
28
-
29
- __ggml_vocab_test__
30
- Hello world
31
- __ggml_vocab_test__
32
- Hello world
33
- __ggml_vocab_test__
34
- Hello World
35
- __ggml_vocab_test__
36
- Hello World
37
- __ggml_vocab_test__
38
- Hello World!
39
- __ggml_vocab_test__
40
- Hello, world!
41
- __ggml_vocab_test__
42
- Hello, world!
43
- __ggml_vocab_test__
44
- this is 🦙.cpp
45
- __ggml_vocab_test__
46
- w048 7tuijk dsdfhu
47
- __ggml_vocab_test__
48
- нещо на Български
49
- __ggml_vocab_test__
50
- កាន់តែពិសេសអាចខលចេញ
51
- __ggml_vocab_test__
52
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ (only emoji that has its own token)
53
- __ggml_vocab_test__
54
- Hello
55
- __ggml_vocab_test__
56
- Hello
57
- __ggml_vocab_test__
58
- Hello
59
- __ggml_vocab_test__
60
- Hello
61
- __ggml_vocab_test__
62
- Hello
63
- __ggml_vocab_test__
64
- Hello
65
- Hello
66
- __ggml_vocab_test__
67
- (
68
- __ggml_vocab_test__
69
-
70
- =
71
- __ggml_vocab_test__
72
- ' era
73
- __ggml_vocab_test__
74
- Hello, y'all! How are you 😁 ?我想在apple工作1314151天~
75
- __ggml_vocab_test__
76
- !!!!!!
77
- __ggml_vocab_test__
78
- 3
79
- __ggml_vocab_test__
80
- 33
81
- __ggml_vocab_test__
82
- 333
83
- __ggml_vocab_test__
84
- 3333
85
- __ggml_vocab_test__
86
- 33333
87
- __ggml_vocab_test__
88
- 333333
89
- __ggml_vocab_test__
90
- 3333333
91
- __ggml_vocab_test__
92
- 33333333
93
- __ggml_vocab_test__
94
- 333333333
95
- __ggml_vocab_test__
96
- Cửa Việt
97
- __ggml_vocab_test__
98
- discards
99
- __ggml_vocab_test__
100
-
101
-
102
-
103
-
104
-
105
-
106
-
107
-
108
-
109
-
110
-
111
- 🚀 (normal) 😶‍🌫️ (multiple emojis concatenated) ✅ 🦙🦙 3 33 333 3333 33333 333333 3333333 33333333 3.3 3..3 3...3 កាន់តែពិសេសអាច😁 ?我想在apple工作1314151天~ ------======= нещо на Български ''''''```````""""......!!!!!!?????? I've been 'told he's there, 'RE you sure? 'M not sure I'll make it, 'D you like some tea? We'Ve a'lL
112
- __ggml_vocab_test__
@@ -1,46 +0,0 @@
1
- 4850 244 57 244 162 159 17722
2
- 75 2022 3943 284
3
-
4
- 244
5
- 280
6
- 283
7
- 221
8
- 222
9
- 499
10
- 3067
11
- 15767
12
- 8302 5810
13
- 12009 5810
14
- 8302 10914
15
- 12009 10914
16
- 12009 10914 38
17
- 8302 49 5810 38
18
- 12009 49 5810 38
19
- 477 458 5954 137 271 51 3779
20
- 124 53 57 61 244 60 121 1726 12568 10240 1519 8290
21
- 39916 8389 1059 9504 40216 13858 2073 8983 12571 1539 10721
22
- 14566 246 14566 152 14566 265 30428 257 14566 261 30428 248 14566 268 14566 153 14566 277 30428 247 14566 277 14566 133 14566 152 14566 251 14566 247 14566 273 14566 251 30428 247 14566 255
23
- 3822 272 246 327 4434 46 18445 152 46030 45022 142 13878 327 12585 19884 33773 40920 751 46 41839 327 2605 22716 708 1421 2840 4387 2421 46
24
- 8302
25
- 12009
26
- 244 12009
27
- 280 12009
28
- 283 12009
29
- 283 12009 303 12009
30
- 327
31
- 222 299
32
- 44 34719
33
- 8302 49 553 44 483 38 4998 904 863 18445 247 1037 4995 13379 2924 9515 17823 54 56 54 57 54 58 54 11904 47892
34
- 9221 3226
35
- 56
36
- 56 56
37
- 56 56 56
38
- 56 56 56 56
39
- 56 56 56 56 56
40
- 56 56 56 56 56 56
41
- 56 56 56 56 56 56 56
42
- 56 56 56 56 56 56 56 56
43
- 56 56 56 56 56 56 56 56 56
44
- 72 34269 102 33245 17234 121
45
- 1236 12266
46
- 353 736 8886 221 10883 4238 16101 28540 222 3822 272 246 327 4434 46 18445 152 46030 45022 142 13878 327 12585 19884 33773 40920 751 46 41839 5954 137 271 3822 137 271 244 56 244 56 56 244 56 56 56 244 56 56 56 56 244 56 56 56 56 56 244 56 56 56 56 56 56 244 56 56 56 56 56 56 56 244 56 56 56 56 56 56 56 56 244 56 51 56 244 56 516 56 244 56 1198 56 244 14566 246 14566 152 14566 265 30428 257 14566 261 30428 248 14566 268 14566 153 14566 277 30428 247 14566 277 14566 133 14566 152 14566 251 36570 247 1037 4995 13379 2924 9515 17823 54 56 54 57 54 58 54 11904 47892 20895 16625 13047 8389 1059 9504 40216 13858 2073 8983 12571 1539 10721 5918 9643 13298 932 31723 31330 9221 3226 35426 10400 457 4783 2602 349 121 1477 957 1200 2038 49 349 632 863 3673 68 349 82 666 3673 457 4650 1949 580 49 349 73 863 2144 1649 35941 68 2726 44 7728 331 44 113 81
@@ -1,14 +0,0 @@
1
- # dependencies
2
-
3
- find_package(Threads REQUIRED)
4
-
5
- # third-party
6
-
7
- include_directories(${CMAKE_CURRENT_SOURCE_DIR})
8
-
9
- if (EMSCRIPTEN)
10
- else()
11
- if (NOT GGML_BACKEND_DL)
12
- add_subdirectory(vdot)
13
- endif()
14
- endif()
@@ -1,9 +0,0 @@
1
- set(TARGET llama-vdot)
2
- add_executable(${TARGET} vdot.cpp)
3
- target_link_libraries(${TARGET} PRIVATE common llama ${CMAKE_THREAD_LIBS_INIT})
4
- target_compile_features(${TARGET} PRIVATE cxx_std_17)
5
-
6
- set(TARGET llama-q8dot)
7
- add_executable(${TARGET} q8dot.cpp)
8
- target_link_libraries(${TARGET} PRIVATE common llama ${CMAKE_THREAD_LIBS_INIT})
9
- target_compile_features(${TARGET} PRIVATE cxx_std_17)
@@ -1,173 +0,0 @@
1
- #include <cstdio>
2
- #include <type_traits>
3
- #include <vector>
4
- #include <random>
5
- #include <chrono>
6
- #include <cstdlib>
7
- #include <cmath>
8
- #include <cassert>
9
- #include <cstring>
10
- #include <array>
11
- #include <type_traits>
12
-
13
- #include <ggml.h>
14
- #include <ggml-cpu.h>
15
-
16
- constexpr int kVecSize = 1 << 16;
17
-
18
- // Copy-pasted from ggml.c
19
- #define QK4_0 32
20
- typedef struct {
21
- float d; // delta
22
- uint8_t qs[QK4_0 / 2]; // nibbles / quants
23
- } block_q4_0;
24
- static_assert(sizeof(block_q4_0) == sizeof(float) + QK4_0 / 2, "wrong q4_0 block size/padding");
25
-
26
- #define QK4_1 32
27
- typedef struct {
28
- float d; // delta
29
- float m; // min
30
- uint8_t qs[QK4_1 / 2]; // nibbles / quants
31
- } block_q4_1;
32
- static_assert(sizeof(block_q4_1) == sizeof(float) * 2 + QK4_1 / 2, "wrong q4_1 block size/padding");
33
-
34
- // Copy-pasted from ggml.c
35
- #define QK8_0 32
36
- typedef struct {
37
- float d; // delta
38
- float s; // d * sum(qs[i])
39
- int8_t qs[QK8_0]; // quants
40
- } block_q8_0;
41
- static_assert(sizeof(block_q8_0) == 2*sizeof(float) + QK8_0, "wrong q8_0 block size/padding");
42
-
43
- static_assert(QK4_1 == QK8_0, "QK4_1 and QK8_0 must be the same");
44
- static_assert(QK4_0 == QK8_0, "QK4_0 and QK8_0 must be the same");
45
-
46
- template <typename T>
47
- static void fillQ4blocks(std::vector<T>& blocks, std::mt19937& rndm) {
48
- for (auto& b : blocks) {
49
- b.d = 1;
50
- for (int i=0; i<QK4_1/2; ++i) {
51
- uint8_t v1 = rndm() >> 28;
52
- uint8_t v2 = rndm() >> 28;
53
- b.qs[i] = v1 | (v2 << 4);
54
- }
55
- }
56
- }
57
-
58
- static void fillQ80blocks(std::vector<block_q8_0>& blocks, std::mt19937& rndm) {
59
- for (auto& b : blocks) {
60
- b.d = 1;
61
- int sum = 0;
62
- for (int i=0; i<QK8_0; ++i) {
63
- b.qs[i] = (rndm() >> 24) - 128;
64
- sum += b.qs[i];
65
- }
66
- b.s = b.d * sum;
67
- }
68
- }
69
-
70
- static float simpleDot(const block_q4_0& x, const block_q8_0& y) {
71
- int s1 = 0; //, s2 = 0;
72
- for (int i=0; i<QK4_1/2; i+=2) {
73
- int v1 = x.qs[i+0] & 0xf;
74
- int v2 = x.qs[i+0] >> 4;
75
- int v3 = x.qs[i+1] & 0xf;
76
- int v4 = x.qs[i+1] >> 4;
77
- int j = 2*i;
78
- s1 += v1*y.qs[j] + v2*y.qs[j+1] + v3*y.qs[j+2] + v4*y.qs[j+3];
79
- //s2 += y.qs[j] + y.qs[j+1] + y.qs[j+2] + y.qs[j+3];
80
- }
81
- return y.d * x.d * s1 - 8 * x.d * y.s;
82
- //return y.d * x.d * (s1 - 8 * s2);
83
- }
84
-
85
- static float simpleDot(const block_q4_1& x, const block_q8_0& y) {
86
- int s1 = 0; //, s2 = 0;
87
- for (int i=0; i<QK4_1/2; i+=2) {
88
- int v1 = x.qs[i+0] & 0xf;
89
- int v2 = x.qs[i+0] >> 4;
90
- int v3 = x.qs[i+1] & 0xf;
91
- int v4 = x.qs[i+1] >> 4;
92
- int j = 2*i;
93
- s1 += v1*y.qs[j] + v2*y.qs[j+1] + v3*y.qs[j+2] + v4*y.qs[j+3];
94
- //s2 += y.qs[j] + y.qs[j+1] + y.qs[j+2] + y.qs[j+3];
95
- }
96
- return y.d * x.d * s1 + y.s * x.m;
97
- //return y.d * (x.d * s1 + x.m * s2);
98
- }
99
-
100
- struct Stat {
101
- double sum = 0, sumt = 0, sumt2 = 0, maxt = 0;
102
- int nloop = 0;
103
- void addResult(double s, double t) {
104
- sum += s;
105
- sumt += t; sumt2 += t*t; maxt = std::max(maxt, t);
106
- ++nloop;
107
- }
108
- void reportResult(const char* title) const {
109
- if (nloop < 1) {
110
- printf("%s(%s): no result\n",__func__,title);
111
- return;
112
- }
113
- printf("============ %s\n",title);
114
- printf("<dot> = %g\n",sum/nloop);
115
- auto t = sumt/nloop, dt = sumt2/nloop - t*t;
116
- if (dt > 0) dt = sqrt(dt);
117
- printf("<time> = %g +/- %g us. Max. time = %g us.\n",t,dt,maxt);
118
- }
119
- };
120
-
121
-
122
- int main(int argc, char** argv) {
123
-
124
- int nloop = argc > 1 ? atoi(argv[1]) : 10;
125
- int type = argc > 2 ? atoi(argv[2]) : 1;
126
-
127
- std::mt19937 rndm(1234);
128
-
129
- std::vector<block_q4_1> x41;
130
- std::vector<block_q4_0> x40;
131
- std::vector<block_q8_0> y(kVecSize);
132
- if (type == 0) x40.resize(kVecSize);
133
- else {
134
- x41.resize(kVecSize);
135
- for (auto& b : x41) b.m = 1;
136
- }
137
-
138
- auto ggml_type = type == 0 ? GGML_TYPE_Q4_0 : GGML_TYPE_Q4_1;
139
-
140
- const auto * funcs = ggml_get_type_traits_cpu(ggml_type);
141
-
142
- Stat simple, ggml;
143
-
144
- for (int iloop=0; iloop<nloop; ++iloop) {
145
-
146
- if (type == 0) fillQ4blocks(x40, rndm);
147
- else fillQ4blocks(x41, rndm);
148
- fillQ80blocks(y, rndm);
149
-
150
- auto t1 = std::chrono::high_resolution_clock::now();
151
- double s = 0;
152
- if (type == 0) for (int i=0; i<kVecSize; ++i) s += simpleDot(x40[i], y[i]);
153
- else for (int i=0; i<kVecSize; ++i) s += simpleDot(x41[i], y[i]);
154
- auto t2 = std::chrono::high_resolution_clock::now();
155
- auto t = 1e-3*std::chrono::duration_cast<std::chrono::nanoseconds>(t2-t1).count();
156
- if (iloop > 3) simple.addResult(s, t);
157
-
158
- t1 = std::chrono::high_resolution_clock::now();
159
- float fs;
160
- if (type == 0) funcs->vec_dot(kVecSize * QK4_1, &fs, 0, x40.data(), 0, y.data(), 0, 1);
161
- else funcs->vec_dot(kVecSize * QK4_1, &fs, 0, x41.data(), 0, y.data(), 0, 1);
162
- t2 = std::chrono::high_resolution_clock::now();
163
- t = 1e-3*std::chrono::duration_cast<std::chrono::nanoseconds>(t2-t1).count();
164
- if (iloop > 3) ggml.addResult(fs, t);
165
-
166
- }
167
-
168
- // Report the time (and the average of the dot products so the compiler does not come up with the idea
169
- // of optimizing away the function calls after figuring that the result is not used).
170
- simple.reportResult("Simple");
171
- ggml.reportResult("ggml");
172
- return 0;
173
- }