cactus-react-native 0.2.10 → 1.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (510)
  1. package/Cactus.podspec +34 -0
  2. package/LICENSE +38 -0
  3. package/README.md +283 -722
  4. package/android/CMakeLists.txt +40 -0
  5. package/android/build.gradle +68 -44
  6. package/android/gradle.properties +5 -5
  7. package/android/src/main/AndroidManifest.xml +1 -3
  8. package/android/src/main/cpp/cpp-adapter.cpp +6 -0
  9. package/android/src/main/java/com/margelo/nitro/cactus/CactusPackage.kt +22 -0
  10. package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusCrypto.kt +38 -0
  11. package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusDeviceInfo.kt +24 -0
  12. package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusFileSystem.kt +227 -0
  13. package/android/src/main/jniLibs/arm64-v8a/{libcactus.so → libcactus.a} +0 -0
  14. package/android/src/main/jniLibs/arm64-v8a/libcactus_util.so +0 -0
  15. package/cpp/HybridCactus.cpp +123 -0
  16. package/cpp/HybridCactus.hpp +35 -0
  17. package/cpp/HybridCactusUtil.cpp +45 -0
  18. package/cpp/HybridCactusUtil.hpp +26 -0
  19. package/cpp/cactus_ffi.h +55 -0
  20. package/cpp/cactus_util.h +25 -0
  21. package/ios/HybridCactusCrypto.swift +37 -0
  22. package/ios/HybridCactusDeviceInfo.swift +32 -0
  23. package/ios/HybridCactusFileSystem.swift +234 -0
  24. package/ios/cactus.xcframework/{info.plist → Info.plist} +2 -37
  25. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus.h +8 -229
  26. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus_ffi.h +28 -229
  27. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/engine.h +347 -0
  28. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ffi_utils.h +286 -0
  29. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/graph.h +319 -0
  30. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/kernel.h +254 -0
  31. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/kernel_utils.h +343 -0
  32. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Info.plist +0 -0
  33. package/ios/cactus.xcframework/ios-arm64/cactus.framework/cactus +0 -0
  34. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus.h +11 -0
  35. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus_ffi.h +55 -0
  36. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/engine.h +347 -0
  37. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/ffi_utils.h +286 -0
  38. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/graph.h +319 -0
  39. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/kernel.h +254 -0
  40. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/kernel_utils.h +343 -0
  41. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Info.plist +0 -0
  42. package/ios/cactus.xcframework/{tvos-arm64_x86_64-simulator → ios-arm64-simulator}/cactus.framework/_CodeSignature/CodeResources +1 -1
  43. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/cactus +0 -0
  44. package/ios/cactus_util.xcframework/Info.plist +39 -0
  45. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/cactus_util.h +25 -0
  46. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/ios_utils.h +10 -0
  47. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/logging.h +25 -0
  48. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Info.plist +0 -0
  49. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/cactus_util +0 -0
  50. package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/cactus_util.h +25 -0
  51. package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/ios_utils.h +10 -0
  52. package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/logging.h +25 -0
  53. package/ios/{cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework → cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework}/Info.plist +0 -0
  54. package/ios/{cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework → cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework}/_CodeSignature/CodeResources +36 -2
  55. package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/cactus_util +0 -0
  56. package/lib/module/api/Database.js +60 -0
  57. package/lib/module/api/Database.js.map +1 -0
  58. package/lib/module/classes/CactusLM.js +149 -0
  59. package/lib/module/classes/CactusLM.js.map +1 -0
  60. package/lib/module/config/CactusConfig.js +6 -0
  61. package/lib/module/config/CactusConfig.js.map +1 -0
  62. package/lib/module/constants/packageVersion.js +4 -0
  63. package/lib/module/constants/packageVersion.js.map +1 -0
  64. package/lib/module/hooks/useCactusLM.js +233 -0
  65. package/lib/module/hooks/useCactusLM.js.map +1 -0
  66. package/lib/module/index.js +9 -409
  67. package/lib/module/index.js.map +1 -1
  68. package/lib/module/native/Cactus.js +50 -0
  69. package/lib/module/native/Cactus.js.map +1 -0
  70. package/lib/module/native/CactusCrypto.js +10 -0
  71. package/lib/module/native/CactusCrypto.js.map +1 -0
  72. package/lib/module/native/CactusDeviceInfo.js +13 -0
  73. package/lib/module/native/CactusDeviceInfo.js.map +1 -0
  74. package/lib/module/native/CactusFileSystem.js +35 -0
  75. package/lib/module/native/CactusFileSystem.js.map +1 -0
  76. package/lib/module/native/CactusUtil.js +23 -0
  77. package/lib/module/native/CactusUtil.js.map +1 -0
  78. package/lib/module/native/index.js +8 -0
  79. package/lib/module/native/index.js.map +1 -0
  80. package/lib/module/specs/Cactus.nitro.js +4 -0
  81. package/lib/module/specs/Cactus.nitro.js.map +1 -0
  82. package/lib/module/specs/CactusCrypto.nitro.js +4 -0
  83. package/lib/module/specs/CactusCrypto.nitro.js.map +1 -0
  84. package/lib/module/specs/CactusDeviceInfo.nitro.js +4 -0
  85. package/lib/module/specs/CactusDeviceInfo.nitro.js.map +1 -0
  86. package/lib/module/specs/CactusFileSystem.nitro.js +4 -0
  87. package/lib/module/specs/CactusFileSystem.nitro.js.map +1 -0
  88. package/lib/module/specs/CactusUtil.nitro.js +4 -0
  89. package/lib/module/specs/CactusUtil.nitro.js.map +1 -0
  90. package/lib/module/telemetry/Telemetry.js +100 -0
  91. package/lib/module/telemetry/Telemetry.js.map +1 -0
  92. package/lib/module/types/CactusLM.js +2 -0
  93. package/lib/module/types/CactusLM.js.map +1 -0
  94. package/lib/module/types/CactusModel.js +2 -0
  95. package/lib/module/types/CactusModel.js.map +1 -0
  96. package/lib/module/utils/error.js +4 -0
  97. package/lib/module/utils/error.js.map +1 -0
  98. package/lib/typescript/package.json +1 -0
  99. package/lib/typescript/src/api/Database.d.ts +11 -0
  100. package/lib/typescript/src/api/Database.d.ts.map +1 -0
  101. package/lib/typescript/src/classes/CactusLM.d.ts +25 -0
  102. package/lib/typescript/src/classes/CactusLM.d.ts.map +1 -0
  103. package/lib/typescript/src/config/CactusConfig.d.ts +5 -0
  104. package/lib/typescript/src/config/CactusConfig.d.ts.map +1 -0
  105. package/lib/typescript/src/constants/packageVersion.d.ts +2 -0
  106. package/lib/typescript/src/constants/packageVersion.d.ts.map +1 -0
  107. package/lib/typescript/src/hooks/useCactusLM.d.ts +20 -0
  108. package/lib/typescript/src/hooks/useCactusLM.d.ts.map +1 -0
  109. package/lib/typescript/src/index.d.ts +6 -0
  110. package/lib/typescript/src/index.d.ts.map +1 -0
  111. package/lib/typescript/src/native/Cactus.d.ts +11 -0
  112. package/lib/typescript/src/native/Cactus.d.ts.map +1 -0
  113. package/lib/typescript/src/native/CactusCrypto.d.ts +5 -0
  114. package/lib/typescript/src/native/CactusCrypto.d.ts.map +1 -0
  115. package/lib/typescript/src/native/CactusDeviceInfo.d.ts +7 -0
  116. package/lib/typescript/src/native/CactusDeviceInfo.d.ts.map +1 -0
  117. package/lib/typescript/src/native/CactusFileSystem.d.ts +13 -0
  118. package/lib/typescript/src/native/CactusFileSystem.d.ts.map +1 -0
  119. package/lib/typescript/src/native/CactusUtil.d.ts +6 -0
  120. package/lib/typescript/src/native/CactusUtil.d.ts.map +1 -0
  121. package/lib/typescript/src/native/index.d.ts +6 -0
  122. package/lib/typescript/src/native/index.d.ts.map +1 -0
  123. package/lib/typescript/src/specs/Cactus.nitro.d.ts +13 -0
  124. package/lib/typescript/src/specs/Cactus.nitro.d.ts.map +1 -0
  125. package/lib/typescript/src/specs/CactusCrypto.nitro.d.ts +8 -0
  126. package/lib/typescript/src/specs/CactusCrypto.nitro.d.ts.map +1 -0
  127. package/lib/typescript/src/specs/CactusDeviceInfo.nitro.d.ts +16 -0
  128. package/lib/typescript/src/specs/CactusDeviceInfo.nitro.d.ts.map +1 -0
  129. package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts +16 -0
  130. package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts.map +1 -0
  131. package/lib/typescript/src/specs/CactusUtil.nitro.d.ts +10 -0
  132. package/lib/typescript/src/specs/CactusUtil.nitro.d.ts.map +1 -0
  133. package/lib/typescript/src/telemetry/Telemetry.d.ts +30 -0
  134. package/lib/typescript/src/telemetry/Telemetry.d.ts.map +1 -0
  135. package/lib/typescript/src/types/CactusLM.d.ts +65 -0
  136. package/lib/typescript/src/types/CactusLM.d.ts.map +1 -0
  137. package/lib/typescript/src/types/CactusModel.d.ts +12 -0
  138. package/lib/typescript/src/types/CactusModel.d.ts.map +1 -0
  139. package/lib/typescript/src/utils/error.d.ts +2 -0
  140. package/lib/typescript/src/utils/error.d.ts.map +1 -0
  141. package/nitro.json +31 -0
  142. package/nitrogen/generated/android/c++/JDeviceInfo.hpp +74 -0
  143. package/nitrogen/generated/android/c++/JFunc_void_double.hpp +74 -0
  144. package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.cpp +65 -0
  145. package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.hpp +65 -0
  146. package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.cpp +85 -0
  147. package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.hpp +66 -0
  148. package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.cpp +192 -0
  149. package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.hpp +73 -0
  150. package/nitrogen/generated/android/cactus+autolinking.cmake +87 -0
  151. package/nitrogen/generated/android/cactus+autolinking.gradle +27 -0
  152. package/nitrogen/generated/android/cactusOnLoad.cpp +86 -0
  153. package/nitrogen/generated/android/cactusOnLoad.hpp +25 -0
  154. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/DeviceInfo.kt +50 -0
  155. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/Func_void_double.kt +80 -0
  156. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusCryptoSpec.kt +58 -0
  157. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusDeviceInfoSpec.kt +62 -0
  158. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusFileSystemSpec.kt +95 -0
  159. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/cactusOnLoad.kt +35 -0
  160. package/nitrogen/generated/ios/Cactus+autolinking.rb +60 -0
  161. package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.cpp +122 -0
  162. package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.hpp +373 -0
  163. package/nitrogen/generated/ios/Cactus-Swift-Cxx-Umbrella.hpp +60 -0
  164. package/nitrogen/generated/ios/CactusAutolinking.mm +69 -0
  165. package/nitrogen/generated/ios/CactusAutolinking.swift +55 -0
  166. package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.cpp +11 -0
  167. package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.hpp +77 -0
  168. package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.cpp +11 -0
  169. package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.hpp +88 -0
  170. package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.cpp +11 -0
  171. package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.hpp +143 -0
  172. package/nitrogen/generated/ios/swift/DeviceInfo.swift +98 -0
  173. package/nitrogen/generated/ios/swift/Func_void.swift +47 -0
  174. package/nitrogen/generated/ios/swift/Func_void_DeviceInfo.swift +47 -0
  175. package/nitrogen/generated/ios/swift/Func_void_bool.swift +47 -0
  176. package/nitrogen/generated/ios/swift/Func_void_double.swift +47 -0
  177. package/nitrogen/generated/ios/swift/Func_void_std__exception_ptr.swift +47 -0
  178. package/nitrogen/generated/ios/swift/Func_void_std__optional_std__string_.swift +54 -0
  179. package/nitrogen/generated/ios/swift/Func_void_std__string.swift +47 -0
  180. package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec.swift +57 -0
  181. package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec_cxx.swift +139 -0
  182. package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec.swift +58 -0
  183. package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec_cxx.swift +164 -0
  184. package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec.swift +65 -0
  185. package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec_cxx.swift +303 -0
  186. package/nitrogen/generated/shared/c++/DeviceInfo.hpp +92 -0
  187. package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.cpp +21 -0
  188. package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.hpp +63 -0
  189. package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.cpp +22 -0
  190. package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.hpp +67 -0
  191. package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.cpp +29 -0
  192. package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.hpp +73 -0
  193. package/nitrogen/generated/shared/c++/HybridCactusSpec.cpp +26 -0
  194. package/nitrogen/generated/shared/c++/HybridCactusSpec.hpp +71 -0
  195. package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.cpp +23 -0
  196. package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.hpp +66 -0
  197. package/package.json +84 -143
  198. package/src/api/Database.ts +83 -0
  199. package/src/classes/CactusLM.ts +203 -0
  200. package/src/config/CactusConfig.ts +4 -0
  201. package/src/constants/packageVersion.ts +1 -0
  202. package/src/hooks/useCactusLM.ts +282 -0
  203. package/src/index.tsx +23 -0
  204. package/src/native/Cactus.ts +79 -0
  205. package/src/native/CactusCrypto.ts +11 -0
  206. package/src/native/CactusDeviceInfo.ts +18 -0
  207. package/src/native/CactusFileSystem.ts +47 -0
  208. package/src/native/CactusUtil.ts +27 -0
  209. package/src/native/index.ts +5 -0
  210. package/src/specs/Cactus.nitro.ts +16 -0
  211. package/src/specs/CactusCrypto.nitro.ts +6 -0
  212. package/src/specs/CactusDeviceInfo.nitro.ts +15 -0
  213. package/src/specs/CactusFileSystem.nitro.ts +21 -0
  214. package/src/specs/CactusUtil.nitro.ts +8 -0
  215. package/src/telemetry/Telemetry.ts +159 -0
  216. package/src/types/CactusLM.ts +71 -0
  217. package/src/types/CactusModel.ts +14 -0
  218. package/src/utils/error.ts +2 -0
  219. package/LICENSE.txt +0 -20
  220. package/android/src/main/CMakeLists.txt +0 -139
  221. package/android/src/main/java/com/cactus/Cactus.java +0 -1190
  222. package/android/src/main/java/com/cactus/CactusPackage.java +0 -48
  223. package/android/src/main/java/com/cactus/LlamaContext.java +0 -814
  224. package/android/src/main/jni-utils.h +0 -100
  225. package/android/src/main/jni.cpp +0 -1605
  226. package/android/src/main/jniLibs/arm64-v8a/libcactus_v8.so +0 -0
  227. package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2.so +0 -0
  228. package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_dotprod.so +0 -0
  229. package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_dotprod_i8mm.so +0 -0
  230. package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_i8mm.so +0 -0
  231. package/android/src/newarch/java/com/cactus/CactusModule.java +0 -206
  232. package/android/src/oldarch/java/com/cactus/CactusModule.java +0 -205
  233. package/cactus-react-native.podspec +0 -42
  234. package/ios/CMakeLists.txt +0 -131
  235. package/ios/Cactus.h +0 -6
  236. package/ios/Cactus.mm +0 -681
  237. package/ios/CactusContext.h +0 -81
  238. package/ios/CactusContext.mm +0 -1032
  239. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/chat.h +0 -145
  240. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/common.h +0 -674
  241. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-alloc.h +0 -76
  242. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-backend-impl.h +0 -255
  243. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-backend.h +0 -354
  244. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-common.h +0 -1857
  245. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-cpp.h +0 -39
  246. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-cpu.h +0 -143
  247. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-impl.h +0 -601
  248. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-metal-impl.h +0 -622
  249. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-metal.h +0 -66
  250. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-opt.h +0 -237
  251. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-quants.h +0 -100
  252. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-threading.h +0 -14
  253. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml.h +0 -2202
  254. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/gguf.h +0 -202
  255. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
  256. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/json.hpp +0 -24766
  257. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-adapter.h +0 -76
  258. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-arch.h +0 -437
  259. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-batch.h +0 -89
  260. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-chat.h +0 -58
  261. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-context.h +0 -276
  262. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-cparams.h +0 -39
  263. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-cpp.h +0 -30
  264. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-grammar.h +0 -173
  265. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-graph.h +0 -640
  266. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-hparams.h +0 -190
  267. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-impl.h +0 -61
  268. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-io.h +0 -35
  269. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-kv-cache.h +0 -515
  270. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-memory.h +0 -32
  271. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-mmap.h +0 -68
  272. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model-loader.h +0 -169
  273. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model-saver.h +0 -37
  274. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model.h +0 -425
  275. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-sampling.h +0 -32
  276. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-vocab.h +0 -131
  277. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama.h +0 -1376
  278. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/log.h +0 -103
  279. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/minja/chat-template.hpp +0 -542
  280. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/minja/minja.hpp +0 -2974
  281. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/sampling.h +0 -107
  282. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/unicode-data.h +0 -20
  283. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/unicode.h +0 -66
  284. package/ios/cactus.xcframework/ios-arm64/cactus.framework/ggml-llama.metallib +0 -0
  285. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/cactus.h +0 -232
  286. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/cactus_ffi.h +0 -256
  287. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/chat.h +0 -145
  288. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/common.h +0 -674
  289. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-alloc.h +0 -76
  290. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend-impl.h +0 -255
  291. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend.h +0 -354
  292. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-common.h +0 -1857
  293. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpp.h +0 -39
  294. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpu.h +0 -143
  295. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-impl.h +0 -601
  296. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal-impl.h +0 -622
  297. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal.h +0 -66
  298. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-opt.h +0 -237
  299. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-quants.h +0 -100
  300. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-threading.h +0 -14
  301. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml.h +0 -2202
  302. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/gguf.h +0 -202
  303. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
  304. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/json.hpp +0 -24766
  305. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-adapter.h +0 -76
  306. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-arch.h +0 -437
  307. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-batch.h +0 -89
  308. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-chat.h +0 -58
  309. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-context.h +0 -276
  310. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-cparams.h +0 -39
  311. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-cpp.h +0 -30
  312. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-grammar.h +0 -173
  313. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-graph.h +0 -640
  314. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-hparams.h +0 -190
  315. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-impl.h +0 -61
  316. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-io.h +0 -35
  317. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-kv-cache.h +0 -515
  318. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-memory.h +0 -32
  319. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-mmap.h +0 -68
  320. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-loader.h +0 -169
  321. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-saver.h +0 -37
  322. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model.h +0 -425
  323. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-sampling.h +0 -32
  324. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-vocab.h +0 -131
  325. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama.h +0 -1376
  326. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/log.h +0 -103
  327. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/minja/chat-template.hpp +0 -542
  328. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/minja/minja.hpp +0 -2974
  329. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/sampling.h +0 -107
  330. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/unicode-data.h +0 -20
  331. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/unicode.h +0 -66
  332. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/cactus +0 -0
  333. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/ggml-llama-sim.metallib +0 -0
  334. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/cactus.h +0 -232
  335. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/cactus_ffi.h +0 -256
  336. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/chat.h +0 -145
  337. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/common.h +0 -674
  338. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-alloc.h +0 -76
  339. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-backend-impl.h +0 -255
  340. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-backend.h +0 -354
  341. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-common.h +0 -1857
  342. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-cpp.h +0 -39
  343. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-cpu.h +0 -143
  344. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-impl.h +0 -601
  345. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-metal-impl.h +0 -622
  346. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-metal.h +0 -66
  347. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-opt.h +0 -237
  348. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-quants.h +0 -100
  349. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-threading.h +0 -14
  350. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml.h +0 -2202
  351. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/gguf.h +0 -202
  352. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
  353. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/json.hpp +0 -24766
  354. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-adapter.h +0 -76
  355. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-arch.h +0 -437
  356. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-batch.h +0 -89
  357. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-chat.h +0 -58
  358. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-context.h +0 -276
  359. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-cparams.h +0 -39
  360. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-cpp.h +0 -30
  361. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-grammar.h +0 -173
  362. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-graph.h +0 -640
  363. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-hparams.h +0 -190
  364. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-impl.h +0 -61
  365. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-io.h +0 -35
  366. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-kv-cache.h +0 -515
  367. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-memory.h +0 -32
  368. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-mmap.h +0 -68
  369. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model-loader.h +0 -169
  370. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model-saver.h +0 -37
  371. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model.h +0 -425
  372. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-sampling.h +0 -32
  373. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-vocab.h +0 -131
  374. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama.h +0 -1376
  375. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/log.h +0 -103
  376. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/minja/chat-template.hpp +0 -542
  377. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/minja/minja.hpp +0 -2974
  378. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/sampling.h +0 -107
  379. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/unicode-data.h +0 -20
  380. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/unicode.h +0 -66
  381. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Info.plist +0 -0
  382. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/cactus +0 -0
  383. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/ggml-llama.metallib +0 -0
  384. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/cactus.h +0 -232
  385. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/cactus_ffi.h +0 -256
  386. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/chat.h +0 -145
  387. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/common.h +0 -674
  388. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-alloc.h +0 -76
  389. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend-impl.h +0 -255
  390. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend.h +0 -354
  391. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-common.h +0 -1857
  392. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpp.h +0 -39
  393. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpu.h +0 -143
  394. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-impl.h +0 -601
  395. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal-impl.h +0 -622
  396. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal.h +0 -66
  397. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-opt.h +0 -237
  398. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-quants.h +0 -100
  399. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-threading.h +0 -14
  400. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml.h +0 -2202
  401. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/gguf.h +0 -202
  402. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
  403. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/json.hpp +0 -24766
  404. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-adapter.h +0 -76
  405. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-arch.h +0 -437
  406. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-batch.h +0 -89
  407. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-chat.h +0 -58
  408. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-context.h +0 -276
  409. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-cparams.h +0 -39
  410. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-cpp.h +0 -30
  411. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-grammar.h +0 -173
  412. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-graph.h +0 -640
  413. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-hparams.h +0 -190
  414. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-impl.h +0 -61
  415. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-io.h +0 -35
  416. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-kv-cache.h +0 -515
  417. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-memory.h +0 -32
  418. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-mmap.h +0 -68
  419. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-loader.h +0 -169
  420. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-saver.h +0 -37
  421. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model.h +0 -425
  422. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-sampling.h +0 -32
  423. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-vocab.h +0 -131
  424. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama.h +0 -1376
  425. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/log.h +0 -103
  426. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/minja/chat-template.hpp +0 -542
  427. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/minja/minja.hpp +0 -2974
  428. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/sampling.h +0 -107
  429. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/unicode-data.h +0 -20
  430. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/unicode.h +0 -66
  431. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Info.plist +0 -0
  432. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/cactus +0 -0
  433. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/ggml-llama-sim.metallib +0 -0
  434. package/lib/commonjs/NativeCactus.js +0 -9
  435. package/lib/commonjs/NativeCactus.js.map +0 -1
  436. package/lib/commonjs/agent.js +0 -73
  437. package/lib/commonjs/agent.js.map +0 -1
  438. package/lib/commonjs/chat.js +0 -73
  439. package/lib/commonjs/chat.js.map +0 -1
  440. package/lib/commonjs/index.js +0 -523
  441. package/lib/commonjs/index.js.map +0 -1
  442. package/lib/commonjs/lm.js +0 -272
  443. package/lib/commonjs/lm.js.map +0 -1
  444. package/lib/commonjs/package.json +0 -1
  445. package/lib/commonjs/projectId.js +0 -8
  446. package/lib/commonjs/projectId.js.map +0 -1
  447. package/lib/commonjs/remote.js +0 -100
  448. package/lib/commonjs/remote.js.map +0 -1
  449. package/lib/commonjs/telemetry.js +0 -102
  450. package/lib/commonjs/telemetry.js.map +0 -1
  451. package/lib/commonjs/tools.js +0 -72
  452. package/lib/commonjs/tools.js.map +0 -1
  453. package/lib/commonjs/tts.js +0 -29
  454. package/lib/commonjs/tts.js.map +0 -1
  455. package/lib/commonjs/vlm.js +0 -221
  456. package/lib/commonjs/vlm.js.map +0 -1
  457. package/lib/module/NativeCactus.js +0 -5
  458. package/lib/module/NativeCactus.js.map +0 -1
  459. package/lib/module/agent.js +0 -68
  460. package/lib/module/agent.js.map +0 -1
  461. package/lib/module/chat.js +0 -67
  462. package/lib/module/chat.js.map +0 -1
  463. package/lib/module/lm.js +0 -267
  464. package/lib/module/lm.js.map +0 -1
  465. package/lib/module/projectId.js +0 -4
  466. package/lib/module/projectId.js.map +0 -1
  467. package/lib/module/remote.js +0 -91
  468. package/lib/module/remote.js.map +0 -1
  469. package/lib/module/telemetry.js +0 -97
  470. package/lib/module/telemetry.js.map +0 -1
  471. package/lib/module/tools.js +0 -66
  472. package/lib/module/tools.js.map +0 -1
  473. package/lib/module/tts.js +0 -24
  474. package/lib/module/tts.js.map +0 -1
  475. package/lib/module/vlm.js +0 -216
  476. package/lib/module/vlm.js.map +0 -1
  477. package/lib/typescript/NativeCactus.d.ts +0 -252
  478. package/lib/typescript/NativeCactus.d.ts.map +0 -1
  479. package/lib/typescript/agent.d.ts +0 -31
  480. package/lib/typescript/agent.d.ts.map +0 -1
  481. package/lib/typescript/chat.d.ts +0 -23
  482. package/lib/typescript/chat.d.ts.map +0 -1
  483. package/lib/typescript/index.d.ts +0 -114
  484. package/lib/typescript/index.d.ts.map +0 -1
  485. package/lib/typescript/lm.d.ts +0 -36
  486. package/lib/typescript/lm.d.ts.map +0 -1
  487. package/lib/typescript/projectId.d.ts +0 -2
  488. package/lib/typescript/projectId.d.ts.map +0 -1
  489. package/lib/typescript/remote.d.ts +0 -8
  490. package/lib/typescript/remote.d.ts.map +0 -1
  491. package/lib/typescript/telemetry.d.ts +0 -25
  492. package/lib/typescript/telemetry.d.ts.map +0 -1
  493. package/lib/typescript/tools.d.ts +0 -36
  494. package/lib/typescript/tools.d.ts.map +0 -1
  495. package/lib/typescript/tts.d.ts +0 -10
  496. package/lib/typescript/tts.d.ts.map +0 -1
  497. package/lib/typescript/vlm.d.ts +0 -33
  498. package/lib/typescript/vlm.d.ts.map +0 -1
  499. package/scripts/postInstall.js +0 -33
  500. package/src/NativeCactus.ts +0 -317
  501. package/src/agent.ts +0 -112
  502. package/src/chat.ts +0 -91
  503. package/src/index.ts +0 -662
  504. package/src/lm.ts +0 -324
  505. package/src/projectId.ts +0 -1
  506. package/src/remote.ts +0 -113
  507. package/src/telemetry.ts +0 -137
  508. package/src/tools.ts +0 -94
  509. package/src/tts.ts +0 -42
  510. package/src/vlm.ts +0 -276
@@ -1,76 +0,0 @@
1
- #pragma once
2
-
3
- #include "llama.h"
4
-
5
- #include "ggml-cpp.h"
6
-
7
- #include <string>
8
- #include <unordered_map>
9
- #include <vector>
10
-
11
- // TODO: pimpl
12
-
13
- //
14
- // llama_adapter_cvec
15
- //
16
-
17
- struct llama_adapter_cvec {
18
- lm_ggml_tensor * tensor_for(int il) const;
19
-
20
- lm_ggml_tensor * apply_to(lm_ggml_context * ctx, lm_ggml_tensor * cur, int il) const;
21
-
22
- bool apply(
23
- const llama_model & model,
24
- const float * data,
25
- size_t len,
26
- int32_t n_embd,
27
- int32_t il_start,
28
- int32_t il_end);
29
-
30
- private:
31
- bool init(const llama_model & model);
32
-
33
- int32_t layer_start = -1;
34
- int32_t layer_end = -1;
35
-
36
- std::vector<lm_ggml_context_ptr> ctxs;
37
- std::vector<lm_ggml_backend_buffer_ptr> bufs;
38
-
39
- std::vector<lm_ggml_tensor *> tensors; // per layer
40
- };
41
-
42
- //
43
- // llama_adapter_lora
44
- //
45
-
46
- struct llama_adapter_lora_weight {
47
- lm_ggml_tensor * a = nullptr;
48
- lm_ggml_tensor * b = nullptr;
49
-
50
- // get actual scale based on rank and alpha
51
- float get_scale(float alpha, float adapter_scale) const {
52
- const float rank = (float) b->ne[0];
53
- const float scale = alpha ? adapter_scale * alpha / rank : adapter_scale;
54
- return scale;
55
- }
56
-
57
- llama_adapter_lora_weight() = default;
58
- llama_adapter_lora_weight(lm_ggml_tensor * a, lm_ggml_tensor * b) : a(a), b(b) {}
59
- };
60
-
61
- struct llama_adapter_lora {
62
- // map tensor name to lora_a_b
63
- std::unordered_map<std::string, llama_adapter_lora_weight> ab_map;
64
-
65
- std::vector<lm_ggml_context_ptr> ctxs;
66
- std::vector<lm_ggml_backend_buffer_ptr> bufs;
67
-
68
- float alpha;
69
-
70
- llama_adapter_lora() = default;
71
- ~llama_adapter_lora() = default;
72
-
73
- llama_adapter_lora_weight * get_weight(lm_ggml_tensor * w);
74
- };
75
-
76
- using llama_adapter_loras = std::unordered_map<llama_adapter_lora *, float>;
@@ -1,437 +0,0 @@
1
- #pragma once
2
-
3
- #include "ggml.h" // lm_ggml_op
4
-
5
- #include <string>
6
-
7
- //
8
- // gguf constants (sync with gguf.py)
9
- //
10
-
11
- enum llm_arch {
12
- LLM_ARCH_LLAMA,
13
- LLM_ARCH_LLAMA4,
14
- LLM_ARCH_DECI,
15
- LLM_ARCH_FALCON,
16
- LLM_ARCH_BAICHUAN,
17
- LLM_ARCH_GROK,
18
- LLM_ARCH_GPT2,
19
- LLM_ARCH_GPTJ,
20
- LLM_ARCH_GPTNEOX,
21
- LLM_ARCH_MPT,
22
- LLM_ARCH_STARCODER,
23
- LLM_ARCH_REFACT,
24
- LLM_ARCH_BERT,
25
- LLM_ARCH_NOMIC_BERT,
26
- LLM_ARCH_NOMIC_BERT_MOE,
27
- LLM_ARCH_JINA_BERT_V2,
28
- LLM_ARCH_BLOOM,
29
- LLM_ARCH_STABLELM,
30
- LLM_ARCH_QWEN,
31
- LLM_ARCH_QWEN2,
32
- LLM_ARCH_QWEN2MOE,
33
- LLM_ARCH_QWEN2VL,
34
- LLM_ARCH_QWEN3,
35
- LLM_ARCH_QWEN3MOE,
36
- LLM_ARCH_PHI2,
37
- LLM_ARCH_PHI3,
38
- LLM_ARCH_PHIMOE,
39
- LLM_ARCH_PLAMO,
40
- LLM_ARCH_CODESHELL,
41
- LLM_ARCH_ORION,
42
- LLM_ARCH_INTERNLM2,
43
- LLM_ARCH_MINICPM,
44
- LLM_ARCH_MINICPM3,
45
- LLM_ARCH_GEMMA,
46
- LLM_ARCH_GEMMA2,
47
- LLM_ARCH_GEMMA3,
48
- LLM_ARCH_STARCODER2,
49
- LLM_ARCH_MAMBA,
50
- LLM_ARCH_XVERSE,
51
- LLM_ARCH_COMMAND_R,
52
- LLM_ARCH_COHERE2,
53
- LLM_ARCH_DBRX,
54
- LLM_ARCH_OLMO,
55
- LLM_ARCH_OLMO2,
56
- LLM_ARCH_OLMOE,
57
- LLM_ARCH_OPENELM,
58
- LLM_ARCH_ARCTIC,
59
- LLM_ARCH_DEEPSEEK,
60
- LLM_ARCH_DEEPSEEK2,
61
- LLM_ARCH_CHATGLM,
62
- LLM_ARCH_GLM4,
63
- LLM_ARCH_BITNET,
64
- LLM_ARCH_T5,
65
- LLM_ARCH_T5ENCODER,
66
- LLM_ARCH_JAIS,
67
- LLM_ARCH_NEMOTRON,
68
- LLM_ARCH_EXAONE,
69
- LLM_ARCH_RWKV6,
70
- LLM_ARCH_RWKV6QWEN2,
71
- LLM_ARCH_RWKV7,
72
- LLM_ARCH_ARWKV7,
73
- LLM_ARCH_GRANITE,
74
- LLM_ARCH_GRANITE_MOE,
75
- LLM_ARCH_CHAMELEON,
76
- LLM_ARCH_WAVTOKENIZER_DEC,
77
- LLM_ARCH_PLM,
78
- LLM_ARCH_BAILINGMOE,
79
- LLM_ARCH_UNKNOWN,
80
- };
81
-
82
- enum llm_kv {
83
- LLM_KV_GENERAL_TYPE,
84
- LLM_KV_GENERAL_ARCHITECTURE,
85
- LLM_KV_GENERAL_QUANTIZATION_VERSION,
86
- LLM_KV_GENERAL_ALIGNMENT,
87
- LLM_KV_GENERAL_FILE_TYPE,
88
- LLM_KV_GENERAL_NAME,
89
- LLM_KV_GENERAL_AUTHOR,
90
- LLM_KV_GENERAL_VERSION,
91
- LLM_KV_GENERAL_URL,
92
- LLM_KV_GENERAL_DESCRIPTION,
93
- LLM_KV_GENERAL_LICENSE,
94
- LLM_KV_GENERAL_SOURCE_URL,
95
- LLM_KV_GENERAL_SOURCE_HF_REPO,
96
-
97
- LLM_KV_VOCAB_SIZE,
98
- LLM_KV_CONTEXT_LENGTH,
99
- LLM_KV_EMBEDDING_LENGTH,
100
- LLM_KV_FEATURES_LENGTH,
101
- LLM_KV_BLOCK_COUNT,
102
- LLM_KV_LEADING_DENSE_BLOCK_COUNT,
103
- LLM_KV_FEED_FORWARD_LENGTH,
104
- LLM_KV_EXPERT_FEED_FORWARD_LENGTH,
105
- LLM_KV_EXPERT_SHARED_FEED_FORWARD_LENGTH,
106
- LLM_KV_USE_PARALLEL_RESIDUAL,
107
- LLM_KV_TENSOR_DATA_LAYOUT,
108
- LLM_KV_EXPERT_COUNT,
109
- LLM_KV_EXPERT_USED_COUNT,
110
- LLM_KV_EXPERT_SHARED_COUNT,
111
- LLM_KV_EXPERT_WEIGHTS_SCALE,
112
- LLM_KV_EXPERT_WEIGHTS_NORM,
113
- LLM_KV_EXPERT_GATING_FUNC,
114
- LLM_KV_MOE_EVERY_N_LAYERS,
115
- LLM_KV_POOLING_TYPE,
116
- LLM_KV_LOGIT_SCALE,
117
- LLM_KV_DECODER_START_TOKEN_ID,
118
- LLM_KV_ATTN_LOGIT_SOFTCAPPING,
119
- LLM_KV_FINAL_LOGIT_SOFTCAPPING,
120
- LLM_KV_SWIN_NORM,
121
- LLM_KV_RESCALE_EVERY_N_LAYERS,
122
- LLM_KV_TIME_MIX_EXTRA_DIM,
123
- LLM_KV_TIME_DECAY_EXTRA_DIM,
124
- LLM_KV_RESIDUAL_SCALE,
125
- LLM_KV_EMBEDDING_SCALE,
126
- LLM_KV_TOKEN_SHIFT_COUNT,
127
- LLM_KV_INTERLEAVE_MOE_LAYER_STEP,
128
-
129
- LLM_KV_ATTENTION_HEAD_COUNT,
130
- LLM_KV_ATTENTION_HEAD_COUNT_KV,
131
- LLM_KV_ATTENTION_MAX_ALIBI_BIAS,
132
- LLM_KV_ATTENTION_CLAMP_KQV,
133
- LLM_KV_ATTENTION_KEY_LENGTH,
134
- LLM_KV_ATTENTION_VALUE_LENGTH,
135
- LLM_KV_ATTENTION_LAYERNORM_EPS,
136
- LLM_KV_ATTENTION_LAYERNORM_RMS_EPS,
137
- LLM_KV_ATTENTION_GROUPNORM_EPS,
138
- LLM_KV_ATTENTION_GROUPNORM_GROUPS,
139
- LLM_KV_ATTENTION_CAUSAL,
140
- LLM_KV_ATTENTION_Q_LORA_RANK,
141
- LLM_KV_ATTENTION_KV_LORA_RANK,
142
- LLM_KV_ATTENTION_DECAY_LORA_RANK,
143
- LLM_KV_ATTENTION_ICLR_LORA_RANK,
144
- LLM_KV_ATTENTION_VALUE_RESIDUAL_MIX_LORA_RANK,
145
- LLM_KV_ATTENTION_GATE_LORA_RANK,
146
- LLM_KV_ATTENTION_RELATIVE_BUCKETS_COUNT,
147
- LLM_KV_ATTENTION_SLIDING_WINDOW,
148
- LLM_KV_ATTENTION_SCALE,
149
- LLM_KV_ATTENTION_KEY_LENGTH_MLA,
150
- LLM_KV_ATTENTION_VALUE_LENGTH_MLA,
151
-
152
- LLM_KV_ROPE_DIMENSION_COUNT,
153
- LLM_KV_ROPE_DIMENSION_SECTIONS,
154
- LLM_KV_ROPE_FREQ_BASE,
155
- LLM_KV_ROPE_SCALE_LINEAR,
156
- LLM_KV_ROPE_SCALING_TYPE,
157
- LLM_KV_ROPE_SCALING_FACTOR,
158
- LLM_KV_ROPE_SCALING_ATTN_FACTOR,
159
- LLM_KV_ROPE_SCALING_ORIG_CTX_LEN,
160
- LLM_KV_ROPE_SCALING_FINETUNED,
161
- LLM_KV_ROPE_SCALING_YARN_LOG_MUL,
162
-
163
- LLM_KV_SPLIT_NO,
164
- LLM_KV_SPLIT_COUNT,
165
- LLM_KV_SPLIT_TENSORS_COUNT,
166
-
167
- LLM_KV_SSM_INNER_SIZE,
168
- LLM_KV_SSM_CONV_KERNEL,
169
- LLM_KV_SSM_STATE_SIZE,
170
- LLM_KV_SSM_TIME_STEP_RANK,
171
- LLM_KV_SSM_DT_B_C_RMS,
172
-
173
- LLM_KV_WKV_HEAD_SIZE,
174
-
175
- LLM_KV_TOKENIZER_MODEL,
176
- LLM_KV_TOKENIZER_PRE,
177
- LLM_KV_TOKENIZER_LIST,
178
- LLM_KV_TOKENIZER_TOKEN_TYPE,
179
- LLM_KV_TOKENIZER_TOKEN_TYPE_COUNT,
180
- LLM_KV_TOKENIZER_SCORES,
181
- LLM_KV_TOKENIZER_MERGES,
182
- LLM_KV_TOKENIZER_BOS_ID,
183
- LLM_KV_TOKENIZER_EOS_ID,
184
- LLM_KV_TOKENIZER_EOT_ID,
185
- LLM_KV_TOKENIZER_EOM_ID,
186
- LLM_KV_TOKENIZER_UNK_ID,
187
- LLM_KV_TOKENIZER_SEP_ID,
188
- LLM_KV_TOKENIZER_PAD_ID,
189
- LLM_KV_TOKENIZER_CLS_ID,
190
- LLM_KV_TOKENIZER_MASK_ID,
191
- LLM_KV_TOKENIZER_ADD_BOS,
192
- LLM_KV_TOKENIZER_ADD_EOS,
193
- LLM_KV_TOKENIZER_ADD_PREFIX,
194
- LLM_KV_TOKENIZER_REMOVE_EXTRA_WS,
195
- LLM_KV_TOKENIZER_PRECOMPILED_CHARSMAP,
196
- LLM_KV_TOKENIZER_HF_JSON,
197
- LLM_KV_TOKENIZER_RWKV,
198
- LLM_KV_TOKENIZER_CHAT_TEMPLATE,
199
- LLM_KV_TOKENIZER_CHAT_TEMPLATE_N,
200
- LLM_KV_TOKENIZER_FIM_PRE_ID,
201
- LLM_KV_TOKENIZER_FIM_SUF_ID,
202
- LLM_KV_TOKENIZER_FIM_MID_ID,
203
- LLM_KV_TOKENIZER_FIM_PAD_ID,
204
- LLM_KV_TOKENIZER_FIM_REP_ID,
205
- LLM_KV_TOKENIZER_FIM_SEP_ID,
206
-
207
- LLM_KV_ADAPTER_TYPE,
208
- LLM_KV_ADAPTER_LORA_ALPHA,
209
-
210
- LLM_KV_POSNET_EMBEDDING_LENGTH,
211
- LLM_KV_POSNET_BLOCK_COUNT,
212
-
213
- LLM_KV_CONVNEXT_EMBEDDING_LENGTH,
214
- LLM_KV_CONVNEXT_BLOCK_COUNT,
215
-
216
- // deprecated:
217
- LLM_KV_TOKENIZER_PREFIX_ID,
218
- LLM_KV_TOKENIZER_SUFFIX_ID,
219
- LLM_KV_TOKENIZER_MIDDLE_ID,
220
- };
221
-
222
- enum llm_tensor {
223
- LLM_TENSOR_TOKEN_EMBD,
224
- LLM_TENSOR_TOKEN_EMBD_NORM,
225
- LLM_TENSOR_TOKEN_TYPES,
226
- LLM_TENSOR_POS_EMBD,
227
- LLM_TENSOR_OUTPUT,
228
- LLM_TENSOR_OUTPUT_NORM,
229
- LLM_TENSOR_ROPE_FREQS,
230
- LLM_TENSOR_ROPE_FACTORS_LONG,
231
- LLM_TENSOR_ROPE_FACTORS_SHORT,
232
- LLM_TENSOR_ATTN_Q,
233
- LLM_TENSOR_ATTN_K,
234
- LLM_TENSOR_ATTN_V,
235
- LLM_TENSOR_ATTN_QKV,
236
- LLM_TENSOR_ATTN_OUT,
237
- LLM_TENSOR_ATTN_NORM,
238
- LLM_TENSOR_ATTN_NORM_2,
239
- LLM_TENSOR_ATTN_OUT_NORM,
240
- LLM_TENSOR_ATTN_POST_NORM,
241
- LLM_TENSOR_ATTN_ROT_EMBD,
242
- LLM_TENSOR_FFN_GATE_INP,
243
- LLM_TENSOR_FFN_GATE_INP_SHEXP,
244
- LLM_TENSOR_FFN_NORM,
245
- LLM_TENSOR_FFN_POST_NORM,
246
- LLM_TENSOR_FFN_GATE,
247
- LLM_TENSOR_FFN_DOWN,
248
- LLM_TENSOR_FFN_UP,
249
- LLM_TENSOR_FFN_ACT,
250
- LLM_TENSOR_FFN_DOWN_EXP, // split experts for backward compatibility
251
- LLM_TENSOR_FFN_GATE_EXP,
252
- LLM_TENSOR_FFN_UP_EXP,
253
- LLM_TENSOR_FFN_NORM_EXPS,
254
- LLM_TENSOR_FFN_DOWN_EXPS, // merged experts
255
- LLM_TENSOR_FFN_GATE_EXPS,
256
- LLM_TENSOR_FFN_UP_EXPS,
257
- LLM_TENSOR_FFN_DOWN_SHEXP,
258
- LLM_TENSOR_FFN_GATE_SHEXP,
259
- LLM_TENSOR_FFN_UP_SHEXP,
260
- LLM_TENSOR_FFN_EXP_PROBS_B,
261
- LLM_TENSOR_ATTN_Q_NORM,
262
- LLM_TENSOR_ATTN_K_NORM,
263
- LLM_TENSOR_LAYER_OUT_NORM,
264
- LLM_TENSOR_POST_ATTN_NORM,
265
- LLM_TENSOR_POST_MLP_NORM,
266
- LLM_TENSOR_SSM_IN,
267
- LLM_TENSOR_SSM_CONV1D,
268
- LLM_TENSOR_SSM_X,
269
- LLM_TENSOR_SSM_DT,
270
- LLM_TENSOR_SSM_A,
271
- LLM_TENSOR_SSM_D,
272
- LLM_TENSOR_SSM_OUT,
273
- LLM_TENSOR_TIME_MIX_W0,
274
- LLM_TENSOR_TIME_MIX_W1,
275
- LLM_TENSOR_TIME_MIX_W2,
276
- LLM_TENSOR_TIME_MIX_A0,
277
- LLM_TENSOR_TIME_MIX_A1,
278
- LLM_TENSOR_TIME_MIX_A2,
279
- LLM_TENSOR_TIME_MIX_V0,
280
- LLM_TENSOR_TIME_MIX_V1,
281
- LLM_TENSOR_TIME_MIX_V2,
282
- LLM_TENSOR_TIME_MIX_G1,
283
- LLM_TENSOR_TIME_MIX_G2,
284
- LLM_TENSOR_TIME_MIX_K_K,
285
- LLM_TENSOR_TIME_MIX_K_A,
286
- LLM_TENSOR_TIME_MIX_R_K,
287
- LLM_TENSOR_TIME_MIX_LERP_X,
288
- LLM_TENSOR_TIME_MIX_LERP_W,
289
- LLM_TENSOR_TIME_MIX_LERP_K,
290
- LLM_TENSOR_TIME_MIX_LERP_V,
291
- LLM_TENSOR_TIME_MIX_LERP_R,
292
- LLM_TENSOR_TIME_MIX_LERP_G,
293
- LLM_TENSOR_TIME_MIX_LERP_FUSED,
294
- LLM_TENSOR_TIME_MIX_FIRST,
295
- LLM_TENSOR_TIME_MIX_DECAY,
296
- LLM_TENSOR_TIME_MIX_DECAY_W1,
297
- LLM_TENSOR_TIME_MIX_DECAY_W2,
298
- LLM_TENSOR_TIME_MIX_KEY,
299
- LLM_TENSOR_TIME_MIX_VALUE,
300
- LLM_TENSOR_TIME_MIX_RECEPTANCE,
301
- LLM_TENSOR_TIME_MIX_GATE,
302
- LLM_TENSOR_TIME_MIX_LN,
303
- LLM_TENSOR_TIME_MIX_OUTPUT,
304
- LLM_TENSOR_CHANNEL_MIX_LERP_K,
305
- LLM_TENSOR_CHANNEL_MIX_LERP_R,
306
- LLM_TENSOR_CHANNEL_MIX_KEY,
307
- LLM_TENSOR_CHANNEL_MIX_RECEPTANCE,
308
- LLM_TENSOR_CHANNEL_MIX_VALUE,
309
- LLM_TENSOR_ATTN_Q_A,
310
- LLM_TENSOR_ATTN_Q_B,
311
- LLM_TENSOR_ATTN_KV_A_MQA,
312
- LLM_TENSOR_ATTN_KV_B,
313
- LLM_TENSOR_ATTN_K_B,
314
- LLM_TENSOR_ATTN_V_B,
315
- LLM_TENSOR_ATTN_Q_A_NORM,
316
- LLM_TENSOR_ATTN_KV_A_NORM,
317
- LLM_TENSOR_ATTN_SUB_NORM,
318
- LLM_TENSOR_FFN_SUB_NORM,
319
- LLM_TENSOR_DEC_ATTN_NORM,
320
- LLM_TENSOR_DEC_ATTN_Q,
321
- LLM_TENSOR_DEC_ATTN_K,
322
- LLM_TENSOR_DEC_ATTN_V,
323
- LLM_TENSOR_DEC_ATTN_OUT,
324
- LLM_TENSOR_DEC_ATTN_REL_B,
325
- LLM_TENSOR_DEC_CROSS_ATTN_NORM,
326
- LLM_TENSOR_DEC_CROSS_ATTN_Q,
327
- LLM_TENSOR_DEC_CROSS_ATTN_K,
328
- LLM_TENSOR_DEC_CROSS_ATTN_V,
329
- LLM_TENSOR_DEC_CROSS_ATTN_OUT,
330
- LLM_TENSOR_DEC_CROSS_ATTN_REL_B,
331
- LLM_TENSOR_DEC_FFN_NORM,
332
- LLM_TENSOR_DEC_FFN_GATE,
333
- LLM_TENSOR_DEC_FFN_DOWN,
334
- LLM_TENSOR_DEC_FFN_UP,
335
- LLM_TENSOR_DEC_OUTPUT_NORM,
336
- LLM_TENSOR_ENC_ATTN_NORM,
337
- LLM_TENSOR_ENC_ATTN_Q,
338
- LLM_TENSOR_ENC_ATTN_K,
339
- LLM_TENSOR_ENC_ATTN_V,
340
- LLM_TENSOR_ENC_ATTN_OUT,
341
- LLM_TENSOR_ENC_ATTN_REL_B,
342
- LLM_TENSOR_ENC_FFN_NORM,
343
- LLM_TENSOR_ENC_FFN_GATE,
344
- LLM_TENSOR_ENC_FFN_DOWN,
345
- LLM_TENSOR_ENC_FFN_UP,
346
- LLM_TENSOR_ENC_OUTPUT_NORM,
347
- LLM_TENSOR_CLS,
348
- LLM_TENSOR_CLS_OUT,
349
- LLM_TENSOR_CONV1D,
350
- LLM_TENSOR_CONVNEXT_DW,
351
- LLM_TENSOR_CONVNEXT_NORM,
352
- LLM_TENSOR_CONVNEXT_PW1,
353
- LLM_TENSOR_CONVNEXT_PW2,
354
- LLM_TENSOR_CONVNEXT_GAMMA,
355
- LLM_TENSOR_POS_NET_CONV1,
356
- LLM_TENSOR_POS_NET_CONV2,
357
- LLM_TENSOR_POS_NET_NORM,
358
- LLM_TENSOR_POS_NET_NORM1,
359
- LLM_TENSOR_POS_NET_NORM2,
360
- LLM_TENSOR_POS_NET_ATTN_NORM,
361
- LLM_TENSOR_POS_NET_ATTN_Q,
362
- LLM_TENSOR_POS_NET_ATTN_K,
363
- LLM_TENSOR_POS_NET_ATTN_V,
364
- LLM_TENSOR_POS_NET_ATTN_OUT,
365
- };
366
-
367
- enum llm_tensor_layer {
368
- LLM_TENSOR_LAYER_INPUT,
369
- LLM_TENSOR_LAYER_REPEATING,
370
- LLM_TENSOR_LAYER_OUTPUT,
371
- };
372
-
373
- struct LLM_KV {
374
- LLM_KV(llm_arch arch, const char * suffix = nullptr);
375
-
376
- llm_arch arch;
377
- const char * suffix;
378
-
379
- std::string operator()(llm_kv kv) const;
380
- };
381
-
382
- // helper to handle gguf constants
383
- // usage:
384
- //
385
- // const auto tn = LLM_TN(LLM_ARCH_LLAMA);
386
- //
387
- // std::string name = tn(LLM_TENSOR_OUTPUT); -> "output"
388
- // std::string name = tn(LLM_TENSOR_TOKEN_EMBD, "bias"); -> "token_embd.bias"
389
- // std::string name = tn(LLM_TENSOR_ATTN_NORM, "weight", 3); -> "blk.3.attn_norm.weight"
390
- //
391
- struct LLM_TN_IMPL {
392
- const llm_arch arch;
393
- const llm_tensor tensor;
394
- const char * const suffix;
395
- const int bid;
396
- const int xid;
397
-
398
- std::string str() const;
399
-
400
- operator std::string() const {
401
- return str();
402
- }
403
-
404
- friend bool operator==(const std::string & str, const LLM_TN_IMPL & tn) {
405
- return str == tn.str();
406
- }
407
-
408
- friend bool operator!=(const std::string & str, const LLM_TN_IMPL & tn) {
409
- return str != tn.str();
410
- }
411
- };
412
-
413
- struct LLM_TN {
414
- LLM_TN(llm_arch arch) : arch(arch) {}
415
-
416
- llm_arch arch;
417
-
418
- LLM_TN_IMPL operator()(llm_tensor tensor, const char * suffix, int bid = -1, int xid = -1) const {
419
- return { arch, tensor, suffix, bid, xid };
420
- }
421
-
422
- LLM_TN_IMPL operator()(llm_tensor tensor, int bid = -1, int xid = -1) const {
423
- return { arch, tensor, nullptr, bid, xid };
424
- }
425
- };
426
-
427
-
428
- struct llm_tensor_info {
429
- llm_tensor_layer layer;
430
- lm_ggml_op op;
431
- };
432
-
433
- const char * llm_arch_name(llm_arch arch);
434
-
435
- llm_arch llm_arch_from_string(const std::string & name);
436
-
437
- const llm_tensor_info & llm_tensor_info_for(llm_tensor tensor);
@@ -1,89 +0,0 @@
1
- #pragma once
2
-
3
- #include "llama.h"
4
-
5
- #include <array>
6
- #include <vector>
7
-
8
- // very similar to llama_batch,
9
- // but has more metadata about sequences
10
- struct llama_ubatch {
11
- bool equal_seqs;
12
- // TODO: whole_seqs for embeddings?
13
-
14
- uint32_t n_tokens; // total tokens (n_seq_tokens * n_seqs)
15
- uint32_t n_seq_tokens; // tokens per sequence
16
- uint32_t n_seqs;
17
-
18
- llama_token * token; // [n_tokens]
19
- float * embd; // [n_embd, n_tokens]
20
- llama_pos * pos; // [n_tokens]
21
- int32_t * n_seq_id; // [n_seqs]
22
- llama_seq_id ** seq_id; // [n_seqs]
23
- int8_t * output; // [n_tokens]
24
- };
25
-
26
- struct llama_sbatch_seq {
27
- int32_t n_seq_id;
28
-
29
- llama_seq_id * seq_id;
30
-
31
- size_t offset;
32
- size_t length;
33
- };
34
-
35
- // sequence-length-aware batch splitting
36
- struct llama_sbatch {
37
- // tokens left in this batch
38
- size_t n_tokens;
39
-
40
- size_t n_embd;
41
-
42
- bool logits_all; // TODO: remove once lctx.logits_all is removed too
43
-
44
- // sorted indices into the batch
45
- std::vector<int64_t> ids;
46
- // batch indices of the output
47
- std::vector<int64_t> out_ids;
48
- std::vector<llama_sbatch_seq> seq;
49
-
50
- const llama_batch * batch = nullptr;
51
-
52
- // buffers for the ubatch
53
- std::vector<llama_token> ubatch_token;
54
- std::vector<float> ubatch_embd;
55
- std::vector<llama_pos> ubatch_pos;
56
- std::vector<int32_t> ubatch_n_seq_id;
57
- std::vector<llama_seq_id *> ubatch_seq_id;
58
- std::vector<int8_t> ubatch_output;
59
-
60
- llama_ubatch reserve_ubatch(size_t n_ubatch, bool has_embd = false);
61
-
62
- void add_seq_to_ubatch(llama_ubatch & ubatch, llama_sbatch_seq & seq, size_t length);
63
-
64
- // simple split, unknown number of sequences of unequal lengths
65
- llama_ubatch split_simple(size_t n_ubatch);
66
-
67
- // make batches of equal-length sequences
68
- llama_ubatch split_equal(size_t n_ubatch);
69
-
70
- // sequence-wise split
71
- llama_ubatch split_seq(size_t n_ubatch);
72
-
73
- llama_sbatch() = default;
74
- llama_sbatch(const llama_batch & batch, size_t n_embd, bool simple_split = false, bool logits_all = false);
75
- };
76
-
77
- // temporary allocate memory for the input batch if needed
78
- struct llama_batch_allocr {
79
- struct llama_batch batch;
80
-
81
- std::array<llama_seq_id, 1> seq_id_0 = { 0 }; // default sequence id
82
- std::vector<llama_pos> pos;
83
- std::vector<int32_t> n_seq_id;
84
- std::vector<llama_seq_id *> seq_id;
85
- std::vector<int8_t> logits;
86
-
87
- // optionally fulfill the batch returned by llama_batch_get_one
88
- llama_batch_allocr(struct llama_batch in_batch, llama_pos p0);
89
- };
@@ -1,58 +0,0 @@
1
- #pragma once
2
-
3
- #include <string>
4
- #include <vector>
5
- #include <cstdint>
6
-
7
- enum llm_chat_template {
8
- LLM_CHAT_TEMPLATE_CHATML,
9
- LLM_CHAT_TEMPLATE_LLAMA_2,
10
- LLM_CHAT_TEMPLATE_LLAMA_2_SYS,
11
- LLM_CHAT_TEMPLATE_LLAMA_2_SYS_BOS,
12
- LLM_CHAT_TEMPLATE_LLAMA_2_SYS_STRIP,
13
- LLM_CHAT_TEMPLATE_MISTRAL_V1,
14
- LLM_CHAT_TEMPLATE_MISTRAL_V3,
15
- LLM_CHAT_TEMPLATE_MISTRAL_V3_TEKKEN,
16
- LLM_CHAT_TEMPLATE_MISTRAL_V7,
17
- LLM_CHAT_TEMPLATE_MISTRAL_V7_TEKKEN,
18
- LLM_CHAT_TEMPLATE_PHI_3,
19
- LLM_CHAT_TEMPLATE_PHI_4,
20
- LLM_CHAT_TEMPLATE_FALCON_3,
21
- LLM_CHAT_TEMPLATE_ZEPHYR,
22
- LLM_CHAT_TEMPLATE_MONARCH,
23
- LLM_CHAT_TEMPLATE_GEMMA,
24
- LLM_CHAT_TEMPLATE_ORION,
25
- LLM_CHAT_TEMPLATE_OPENCHAT,
26
- LLM_CHAT_TEMPLATE_VICUNA,
27
- LLM_CHAT_TEMPLATE_VICUNA_ORCA,
28
- LLM_CHAT_TEMPLATE_DEEPSEEK,
29
- LLM_CHAT_TEMPLATE_DEEPSEEK_2,
30
- LLM_CHAT_TEMPLATE_DEEPSEEK_3,
31
- LLM_CHAT_TEMPLATE_COMMAND_R,
32
- LLM_CHAT_TEMPLATE_LLAMA_3,
33
- LLM_CHAT_TEMPLATE_CHATGLM_3,
34
- LLM_CHAT_TEMPLATE_CHATGLM_4,
35
- LLM_CHAT_TEMPLATE_GLMEDGE,
36
- LLM_CHAT_TEMPLATE_MINICPM,
37
- LLM_CHAT_TEMPLATE_EXAONE_3,
38
- LLM_CHAT_TEMPLATE_RWKV_WORLD,
39
- LLM_CHAT_TEMPLATE_GRANITE,
40
- LLM_CHAT_TEMPLATE_GIGACHAT,
41
- LLM_CHAT_TEMPLATE_MEGREZ,
42
- LLM_CHAT_TEMPLATE_YANDEX,
43
- LLM_CHAT_TEMPLATE_BAILING,
44
- LLM_CHAT_TEMPLATE_LLAMA4,
45
- LLM_CHAT_TEMPLATE_SMOLVLM,
46
- LLM_CHAT_TEMPLATE_UNKNOWN,
47
- };
48
-
49
- struct llama_chat_message;
50
-
51
- llm_chat_template llm_chat_template_from_str(const std::string & name);
52
-
53
- llm_chat_template llm_chat_detect_template(const std::string & tmpl);
54
-
55
- int32_t llm_chat_apply_template(
56
- llm_chat_template tmpl,
57
- const std::vector<const llama_chat_message *> & chat,
58
- std::string & dest, bool add_ass);