cactus-react-native 0.2.11 → 1.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (510):
  1. package/Cactus.podspec +34 -0
  2. package/LICENSE +38 -0
  3. package/README.md +354 -69
  4. package/android/CMakeLists.txt +40 -0
  5. package/android/build.gradle +68 -44
  6. package/android/gradle.properties +5 -5
  7. package/android/src/main/AndroidManifest.xml +1 -3
  8. package/android/src/main/cpp/cpp-adapter.cpp +6 -0
  9. package/android/src/main/java/com/margelo/nitro/cactus/CactusPackage.kt +22 -0
  10. package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusCrypto.kt +38 -0
  11. package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusDeviceInfo.kt +24 -0
  12. package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusFileSystem.kt +227 -0
  13. package/android/src/main/jniLibs/arm64-v8a/{libcactus_v8_2_dotprod.so → libcactus.a} +0 -0
  14. package/android/src/main/jniLibs/arm64-v8a/libcactus_util.so +0 -0
  15. package/cpp/HybridCactus.cpp +123 -0
  16. package/cpp/HybridCactus.hpp +35 -0
  17. package/cpp/HybridCactusUtil.cpp +45 -0
  18. package/cpp/HybridCactusUtil.hpp +26 -0
  19. package/cpp/cactus_ffi.h +55 -0
  20. package/cpp/cactus_util.h +25 -0
  21. package/ios/HybridCactusCrypto.swift +37 -0
  22. package/ios/HybridCactusDeviceInfo.swift +32 -0
  23. package/ios/HybridCactusFileSystem.swift +234 -0
  24. package/ios/cactus.xcframework/{info.plist → Info.plist} +2 -37
  25. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus.h +8 -229
  26. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus_ffi.h +28 -229
  27. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/engine.h +347 -0
  28. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ffi_utils.h +286 -0
  29. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/graph.h +319 -0
  30. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/kernel.h +254 -0
  31. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/kernel_utils.h +343 -0
  32. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Info.plist +0 -0
  33. package/ios/cactus.xcframework/ios-arm64/cactus.framework/cactus +0 -0
  34. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus.h +11 -0
  35. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus_ffi.h +55 -0
  36. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/engine.h +347 -0
  37. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/ffi_utils.h +286 -0
  38. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/graph.h +319 -0
  39. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/kernel.h +254 -0
  40. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/kernel_utils.h +343 -0
  41. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Info.plist +0 -0
  42. package/ios/cactus.xcframework/{tvos-arm64_x86_64-simulator → ios-arm64-simulator}/cactus.framework/_CodeSignature/CodeResources +1 -1
  43. package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/cactus +0 -0
  44. package/ios/cactus_util.xcframework/Info.plist +39 -0
  45. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/cactus_util.h +25 -0
  46. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/ios_utils.h +10 -0
  47. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/logging.h +25 -0
  48. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Info.plist +0 -0
  49. package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/cactus_util +0 -0
  50. package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/cactus_util.h +25 -0
  51. package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/ios_utils.h +10 -0
  52. package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/logging.h +25 -0
  53. package/ios/{cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework → cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework}/Info.plist +0 -0
  54. package/ios/{cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework → cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework}/_CodeSignature/CodeResources +36 -2
  55. package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/cactus_util +0 -0
  56. package/lib/module/api/Database.js +60 -0
  57. package/lib/module/api/Database.js.map +1 -0
  58. package/lib/module/classes/CactusLM.js +149 -0
  59. package/lib/module/classes/CactusLM.js.map +1 -0
  60. package/lib/module/config/CactusConfig.js +6 -0
  61. package/lib/module/config/CactusConfig.js.map +1 -0
  62. package/lib/module/constants/packageVersion.js +4 -0
  63. package/lib/module/constants/packageVersion.js.map +1 -0
  64. package/lib/module/hooks/useCactusLM.js +233 -0
  65. package/lib/module/hooks/useCactusLM.js.map +1 -0
  66. package/lib/module/index.js +9 -409
  67. package/lib/module/index.js.map +1 -1
  68. package/lib/module/native/Cactus.js +50 -0
  69. package/lib/module/native/Cactus.js.map +1 -0
  70. package/lib/module/native/CactusCrypto.js +10 -0
  71. package/lib/module/native/CactusCrypto.js.map +1 -0
  72. package/lib/module/native/CactusDeviceInfo.js +13 -0
  73. package/lib/module/native/CactusDeviceInfo.js.map +1 -0
  74. package/lib/module/native/CactusFileSystem.js +35 -0
  75. package/lib/module/native/CactusFileSystem.js.map +1 -0
  76. package/lib/module/native/CactusUtil.js +23 -0
  77. package/lib/module/native/CactusUtil.js.map +1 -0
  78. package/lib/module/native/index.js +8 -0
  79. package/lib/module/native/index.js.map +1 -0
  80. package/lib/module/specs/Cactus.nitro.js +4 -0
  81. package/lib/module/specs/Cactus.nitro.js.map +1 -0
  82. package/lib/module/specs/CactusCrypto.nitro.js +4 -0
  83. package/lib/module/specs/CactusCrypto.nitro.js.map +1 -0
  84. package/lib/module/specs/CactusDeviceInfo.nitro.js +4 -0
  85. package/lib/module/specs/CactusDeviceInfo.nitro.js.map +1 -0
  86. package/lib/module/specs/CactusFileSystem.nitro.js +4 -0
  87. package/lib/module/specs/CactusFileSystem.nitro.js.map +1 -0
  88. package/lib/module/specs/CactusUtil.nitro.js +4 -0
  89. package/lib/module/specs/CactusUtil.nitro.js.map +1 -0
  90. package/lib/module/telemetry/Telemetry.js +100 -0
  91. package/lib/module/telemetry/Telemetry.js.map +1 -0
  92. package/lib/module/types/CactusLM.js +2 -0
  93. package/lib/module/types/CactusLM.js.map +1 -0
  94. package/lib/module/types/CactusModel.js +2 -0
  95. package/lib/module/types/CactusModel.js.map +1 -0
  96. package/lib/module/utils/error.js +4 -0
  97. package/lib/module/utils/error.js.map +1 -0
  98. package/lib/typescript/package.json +1 -0
  99. package/lib/typescript/src/api/Database.d.ts +11 -0
  100. package/lib/typescript/src/api/Database.d.ts.map +1 -0
  101. package/lib/typescript/src/classes/CactusLM.d.ts +25 -0
  102. package/lib/typescript/src/classes/CactusLM.d.ts.map +1 -0
  103. package/lib/typescript/src/config/CactusConfig.d.ts +5 -0
  104. package/lib/typescript/src/config/CactusConfig.d.ts.map +1 -0
  105. package/lib/typescript/src/constants/packageVersion.d.ts +2 -0
  106. package/lib/typescript/src/constants/packageVersion.d.ts.map +1 -0
  107. package/lib/typescript/src/hooks/useCactusLM.d.ts +20 -0
  108. package/lib/typescript/src/hooks/useCactusLM.d.ts.map +1 -0
  109. package/lib/typescript/src/index.d.ts +6 -0
  110. package/lib/typescript/src/index.d.ts.map +1 -0
  111. package/lib/typescript/src/native/Cactus.d.ts +11 -0
  112. package/lib/typescript/src/native/Cactus.d.ts.map +1 -0
  113. package/lib/typescript/src/native/CactusCrypto.d.ts +5 -0
  114. package/lib/typescript/src/native/CactusCrypto.d.ts.map +1 -0
  115. package/lib/typescript/src/native/CactusDeviceInfo.d.ts +7 -0
  116. package/lib/typescript/src/native/CactusDeviceInfo.d.ts.map +1 -0
  117. package/lib/typescript/src/native/CactusFileSystem.d.ts +13 -0
  118. package/lib/typescript/src/native/CactusFileSystem.d.ts.map +1 -0
  119. package/lib/typescript/src/native/CactusUtil.d.ts +6 -0
  120. package/lib/typescript/src/native/CactusUtil.d.ts.map +1 -0
  121. package/lib/typescript/src/native/index.d.ts +6 -0
  122. package/lib/typescript/src/native/index.d.ts.map +1 -0
  123. package/lib/typescript/src/specs/Cactus.nitro.d.ts +13 -0
  124. package/lib/typescript/src/specs/Cactus.nitro.d.ts.map +1 -0
  125. package/lib/typescript/src/specs/CactusCrypto.nitro.d.ts +8 -0
  126. package/lib/typescript/src/specs/CactusCrypto.nitro.d.ts.map +1 -0
  127. package/lib/typescript/src/specs/CactusDeviceInfo.nitro.d.ts +16 -0
  128. package/lib/typescript/src/specs/CactusDeviceInfo.nitro.d.ts.map +1 -0
  129. package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts +16 -0
  130. package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts.map +1 -0
  131. package/lib/typescript/src/specs/CactusUtil.nitro.d.ts +10 -0
  132. package/lib/typescript/src/specs/CactusUtil.nitro.d.ts.map +1 -0
  133. package/lib/typescript/src/telemetry/Telemetry.d.ts +30 -0
  134. package/lib/typescript/src/telemetry/Telemetry.d.ts.map +1 -0
  135. package/lib/typescript/src/types/CactusLM.d.ts +65 -0
  136. package/lib/typescript/src/types/CactusLM.d.ts.map +1 -0
  137. package/lib/typescript/src/types/CactusModel.d.ts +12 -0
  138. package/lib/typescript/src/types/CactusModel.d.ts.map +1 -0
  139. package/lib/typescript/src/utils/error.d.ts +2 -0
  140. package/lib/typescript/src/utils/error.d.ts.map +1 -0
  141. package/nitro.json +31 -0
  142. package/nitrogen/generated/android/c++/JDeviceInfo.hpp +74 -0
  143. package/nitrogen/generated/android/c++/JFunc_void_double.hpp +74 -0
  144. package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.cpp +65 -0
  145. package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.hpp +65 -0
  146. package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.cpp +85 -0
  147. package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.hpp +66 -0
  148. package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.cpp +192 -0
  149. package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.hpp +73 -0
  150. package/nitrogen/generated/android/cactus+autolinking.cmake +87 -0
  151. package/nitrogen/generated/android/cactus+autolinking.gradle +27 -0
  152. package/nitrogen/generated/android/cactusOnLoad.cpp +86 -0
  153. package/nitrogen/generated/android/cactusOnLoad.hpp +25 -0
  154. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/DeviceInfo.kt +50 -0
  155. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/Func_void_double.kt +80 -0
  156. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusCryptoSpec.kt +58 -0
  157. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusDeviceInfoSpec.kt +62 -0
  158. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusFileSystemSpec.kt +95 -0
  159. package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/cactusOnLoad.kt +35 -0
  160. package/nitrogen/generated/ios/Cactus+autolinking.rb +60 -0
  161. package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.cpp +122 -0
  162. package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.hpp +373 -0
  163. package/nitrogen/generated/ios/Cactus-Swift-Cxx-Umbrella.hpp +60 -0
  164. package/nitrogen/generated/ios/CactusAutolinking.mm +69 -0
  165. package/nitrogen/generated/ios/CactusAutolinking.swift +55 -0
  166. package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.cpp +11 -0
  167. package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.hpp +77 -0
  168. package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.cpp +11 -0
  169. package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.hpp +88 -0
  170. package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.cpp +11 -0
  171. package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.hpp +143 -0
  172. package/nitrogen/generated/ios/swift/DeviceInfo.swift +98 -0
  173. package/nitrogen/generated/ios/swift/Func_void.swift +47 -0
  174. package/nitrogen/generated/ios/swift/Func_void_DeviceInfo.swift +47 -0
  175. package/nitrogen/generated/ios/swift/Func_void_bool.swift +47 -0
  176. package/nitrogen/generated/ios/swift/Func_void_double.swift +47 -0
  177. package/nitrogen/generated/ios/swift/Func_void_std__exception_ptr.swift +47 -0
  178. package/nitrogen/generated/ios/swift/Func_void_std__optional_std__string_.swift +54 -0
  179. package/nitrogen/generated/ios/swift/Func_void_std__string.swift +47 -0
  180. package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec.swift +57 -0
  181. package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec_cxx.swift +139 -0
  182. package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec.swift +58 -0
  183. package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec_cxx.swift +164 -0
  184. package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec.swift +65 -0
  185. package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec_cxx.swift +303 -0
  186. package/nitrogen/generated/shared/c++/DeviceInfo.hpp +92 -0
  187. package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.cpp +21 -0
  188. package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.hpp +63 -0
  189. package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.cpp +22 -0
  190. package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.hpp +67 -0
  191. package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.cpp +29 -0
  192. package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.hpp +73 -0
  193. package/nitrogen/generated/shared/c++/HybridCactusSpec.cpp +26 -0
  194. package/nitrogen/generated/shared/c++/HybridCactusSpec.hpp +71 -0
  195. package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.cpp +23 -0
  196. package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.hpp +66 -0
  197. package/package.json +84 -143
  198. package/src/api/Database.ts +83 -0
  199. package/src/classes/CactusLM.ts +203 -0
  200. package/src/config/CactusConfig.ts +4 -0
  201. package/src/constants/packageVersion.ts +1 -0
  202. package/src/hooks/useCactusLM.ts +282 -0
  203. package/src/index.tsx +23 -0
  204. package/src/native/Cactus.ts +79 -0
  205. package/src/native/CactusCrypto.ts +11 -0
  206. package/src/native/CactusDeviceInfo.ts +18 -0
  207. package/src/native/CactusFileSystem.ts +47 -0
  208. package/src/native/CactusUtil.ts +27 -0
  209. package/src/native/index.ts +5 -0
  210. package/src/specs/Cactus.nitro.ts +16 -0
  211. package/src/specs/CactusCrypto.nitro.ts +6 -0
  212. package/src/specs/CactusDeviceInfo.nitro.ts +15 -0
  213. package/src/specs/CactusFileSystem.nitro.ts +21 -0
  214. package/src/specs/CactusUtil.nitro.ts +8 -0
  215. package/src/telemetry/Telemetry.ts +159 -0
  216. package/src/types/CactusLM.ts +71 -0
  217. package/src/types/CactusModel.ts +14 -0
  218. package/src/utils/error.ts +2 -0
  219. package/LICENSE.txt +0 -20
  220. package/android/src/main/CMakeLists.txt +0 -140
  221. package/android/src/main/java/com/cactus/Cactus.java +0 -1190
  222. package/android/src/main/java/com/cactus/CactusPackage.java +0 -48
  223. package/android/src/main/java/com/cactus/LlamaContext.java +0 -748
  224. package/android/src/main/jni-utils.h +0 -100
  225. package/android/src/main/jni.cpp +0 -1605
  226. package/android/src/main/jniLibs/arm64-v8a/libcactus.so +0 -0
  227. package/android/src/main/jniLibs/arm64-v8a/libcactus_v8.so +0 -0
  228. package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2.so +0 -0
  229. package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_dotprod_i8mm.so +0 -0
  230. package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_i8mm.so +0 -0
  231. package/android/src/newarch/java/com/cactus/CactusModule.java +0 -204
  232. package/android/src/oldarch/java/com/cactus/CactusModule.java +0 -205
  233. package/cactus-react-native.podspec +0 -42
  234. package/ios/CMakeLists.txt +0 -131
  235. package/ios/Cactus.h +0 -6
  236. package/ios/Cactus.mm +0 -681
  237. package/ios/CactusContext.h +0 -81
  238. package/ios/CactusContext.mm +0 -1032
  239. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/chat.h +0 -145
  240. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/common.h +0 -674
  241. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-alloc.h +0 -76
  242. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-backend-impl.h +0 -255
  243. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-backend.h +0 -354
  244. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-common.h +0 -1857
  245. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-cpp.h +0 -39
  246. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-cpu.h +0 -143
  247. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-impl.h +0 -601
  248. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-metal-impl.h +0 -622
  249. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-metal.h +0 -66
  250. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-opt.h +0 -237
  251. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-quants.h +0 -100
  252. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-threading.h +0 -14
  253. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml.h +0 -2202
  254. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/gguf.h +0 -202
  255. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
  256. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/json.hpp +0 -24766
  257. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-adapter.h +0 -76
  258. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-arch.h +0 -437
  259. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-batch.h +0 -89
  260. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-chat.h +0 -58
  261. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-context.h +0 -276
  262. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-cparams.h +0 -39
  263. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-cpp.h +0 -30
  264. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-grammar.h +0 -173
  265. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-graph.h +0 -640
  266. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-hparams.h +0 -190
  267. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-impl.h +0 -61
  268. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-io.h +0 -35
  269. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-kv-cache.h +0 -515
  270. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-memory.h +0 -32
  271. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-mmap.h +0 -68
  272. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model-loader.h +0 -169
  273. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model-saver.h +0 -37
  274. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model.h +0 -425
  275. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-sampling.h +0 -32
  276. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-vocab.h +0 -131
  277. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama.h +0 -1376
  278. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/log.h +0 -103
  279. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/minja/chat-template.hpp +0 -542
  280. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/minja/minja.hpp +0 -2974
  281. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/sampling.h +0 -107
  282. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/unicode-data.h +0 -20
  283. package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/unicode.h +0 -66
  284. package/ios/cactus.xcframework/ios-arm64/cactus.framework/ggml-llama.metallib +0 -0
  285. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/cactus.h +0 -232
  286. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/cactus_ffi.h +0 -256
  287. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/chat.h +0 -145
  288. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/common.h +0 -674
  289. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-alloc.h +0 -76
  290. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend-impl.h +0 -255
  291. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend.h +0 -354
  292. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-common.h +0 -1857
  293. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpp.h +0 -39
  294. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpu.h +0 -143
  295. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-impl.h +0 -601
  296. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal-impl.h +0 -622
  297. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal.h +0 -66
  298. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-opt.h +0 -237
  299. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-quants.h +0 -100
  300. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-threading.h +0 -14
  301. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml.h +0 -2202
  302. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/gguf.h +0 -202
  303. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
  304. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/json.hpp +0 -24766
  305. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-adapter.h +0 -76
  306. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-arch.h +0 -437
  307. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-batch.h +0 -89
  308. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-chat.h +0 -58
  309. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-context.h +0 -276
  310. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-cparams.h +0 -39
  311. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-cpp.h +0 -30
  312. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-grammar.h +0 -173
  313. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-graph.h +0 -640
  314. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-hparams.h +0 -190
  315. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-impl.h +0 -61
  316. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-io.h +0 -35
  317. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-kv-cache.h +0 -515
  318. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-memory.h +0 -32
  319. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-mmap.h +0 -68
  320. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-loader.h +0 -169
  321. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-saver.h +0 -37
  322. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model.h +0 -425
  323. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-sampling.h +0 -32
  324. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-vocab.h +0 -131
  325. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama.h +0 -1376
  326. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/log.h +0 -103
  327. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/minja/chat-template.hpp +0 -542
  328. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/minja/minja.hpp +0 -2974
  329. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/sampling.h +0 -107
  330. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/unicode-data.h +0 -20
  331. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/unicode.h +0 -66
  332. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/cactus +0 -0
  333. package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/ggml-llama-sim.metallib +0 -0
  334. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/cactus.h +0 -232
  335. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/cactus_ffi.h +0 -256
  336. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/chat.h +0 -145
  337. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/common.h +0 -674
  338. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-alloc.h +0 -76
  339. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-backend-impl.h +0 -255
  340. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-backend.h +0 -354
  341. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-common.h +0 -1857
  342. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-cpp.h +0 -39
  343. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-cpu.h +0 -143
  344. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-impl.h +0 -601
  345. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-metal-impl.h +0 -622
  346. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-metal.h +0 -66
  347. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-opt.h +0 -237
  348. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-quants.h +0 -100
  349. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-threading.h +0 -14
  350. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml.h +0 -2202
  351. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/gguf.h +0 -202
  352. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
  353. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/json.hpp +0 -24766
  354. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-adapter.h +0 -76
  355. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-arch.h +0 -437
  356. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-batch.h +0 -89
  357. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-chat.h +0 -58
  358. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-context.h +0 -276
  359. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-cparams.h +0 -39
  360. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-cpp.h +0 -30
  361. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-grammar.h +0 -173
  362. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-graph.h +0 -640
  363. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-hparams.h +0 -190
  364. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-impl.h +0 -61
  365. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-io.h +0 -35
  366. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-kv-cache.h +0 -515
  367. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-memory.h +0 -32
  368. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-mmap.h +0 -68
  369. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model-loader.h +0 -169
  370. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model-saver.h +0 -37
  371. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model.h +0 -425
  372. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-sampling.h +0 -32
  373. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-vocab.h +0 -131
  374. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama.h +0 -1376
  375. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/log.h +0 -103
  376. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/minja/chat-template.hpp +0 -542
  377. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/minja/minja.hpp +0 -2974
  378. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/sampling.h +0 -107
  379. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/unicode-data.h +0 -20
  380. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/unicode.h +0 -66
  381. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Info.plist +0 -0
  382. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/cactus +0 -0
  383. package/ios/cactus.xcframework/tvos-arm64/cactus.framework/ggml-llama.metallib +0 -0
  384. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/cactus.h +0 -232
  385. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/cactus_ffi.h +0 -256
  386. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/chat.h +0 -145
  387. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/common.h +0 -674
  388. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-alloc.h +0 -76
  389. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend-impl.h +0 -255
  390. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend.h +0 -354
  391. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-common.h +0 -1857
  392. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpp.h +0 -39
  393. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpu.h +0 -143
  394. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-impl.h +0 -601
  395. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal-impl.h +0 -622
  396. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal.h +0 -66
  397. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-opt.h +0 -237
  398. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-quants.h +0 -100
  399. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-threading.h +0 -14
  400. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml.h +0 -2202
  401. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/gguf.h +0 -202
  402. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
  403. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/json.hpp +0 -24766
  404. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-adapter.h +0 -76
  405. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-arch.h +0 -437
  406. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-batch.h +0 -89
  407. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-chat.h +0 -58
  408. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-context.h +0 -276
  409. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-cparams.h +0 -39
  410. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-cpp.h +0 -30
  411. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-grammar.h +0 -173
  412. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-graph.h +0 -640
  413. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-hparams.h +0 -190
  414. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-impl.h +0 -61
  415. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-io.h +0 -35
  416. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-kv-cache.h +0 -515
  417. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-memory.h +0 -32
  418. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-mmap.h +0 -68
  419. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-loader.h +0 -169
  420. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-saver.h +0 -37
  421. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model.h +0 -425
  422. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-sampling.h +0 -32
  423. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-vocab.h +0 -131
  424. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama.h +0 -1376
  425. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/log.h +0 -103
  426. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/minja/chat-template.hpp +0 -542
  427. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/minja/minja.hpp +0 -2974
  428. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/sampling.h +0 -107
  429. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/unicode-data.h +0 -20
  430. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/unicode.h +0 -66
  431. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Info.plist +0 -0
  432. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/cactus +0 -0
  433. package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/ggml-llama-sim.metallib +0 -0
  434. package/lib/commonjs/NativeCactus.js +0 -9
  435. package/lib/commonjs/NativeCactus.js.map +0 -1
  436. package/lib/commonjs/agent.js +0 -73
  437. package/lib/commonjs/agent.js.map +0 -1
  438. package/lib/commonjs/chat.js +0 -73
  439. package/lib/commonjs/chat.js.map +0 -1
  440. package/lib/commonjs/index.js +0 -523
  441. package/lib/commonjs/index.js.map +0 -1
  442. package/lib/commonjs/lm.js +0 -272
  443. package/lib/commonjs/lm.js.map +0 -1
  444. package/lib/commonjs/package.json +0 -1
  445. package/lib/commonjs/projectId.js +0 -9
  446. package/lib/commonjs/projectId.js.map +0 -1
  447. package/lib/commonjs/remote.js +0 -100
  448. package/lib/commonjs/remote.js.map +0 -1
  449. package/lib/commonjs/telemetry.js +0 -102
  450. package/lib/commonjs/telemetry.js.map +0 -1
  451. package/lib/commonjs/tools.js +0 -72
  452. package/lib/commonjs/tools.js.map +0 -1
  453. package/lib/commonjs/tts.js +0 -141
  454. package/lib/commonjs/tts.js.map +0 -1
  455. package/lib/commonjs/vlm.js +0 -221
  456. package/lib/commonjs/vlm.js.map +0 -1
  457. package/lib/module/NativeCactus.js +0 -5
  458. package/lib/module/NativeCactus.js.map +0 -1
  459. package/lib/module/agent.js +0 -68
  460. package/lib/module/agent.js.map +0 -1
  461. package/lib/module/chat.js +0 -67
  462. package/lib/module/chat.js.map +0 -1
  463. package/lib/module/lm.js +0 -267
  464. package/lib/module/lm.js.map +0 -1
  465. package/lib/module/projectId.js +0 -5
  466. package/lib/module/projectId.js.map +0 -1
  467. package/lib/module/remote.js +0 -91
  468. package/lib/module/remote.js.map +0 -1
  469. package/lib/module/telemetry.js +0 -97
  470. package/lib/module/telemetry.js.map +0 -1
  471. package/lib/module/tools.js +0 -66
  472. package/lib/module/tools.js.map +0 -1
  473. package/lib/module/tts.js +0 -135
  474. package/lib/module/tts.js.map +0 -1
  475. package/lib/module/vlm.js +0 -216
  476. package/lib/module/vlm.js.map +0 -1
  477. package/lib/typescript/NativeCactus.d.ts +0 -252
  478. package/lib/typescript/NativeCactus.d.ts.map +0 -1
  479. package/lib/typescript/agent.d.ts +0 -31
  480. package/lib/typescript/agent.d.ts.map +0 -1
  481. package/lib/typescript/chat.d.ts +0 -23
  482. package/lib/typescript/chat.d.ts.map +0 -1
  483. package/lib/typescript/index.d.ts +0 -114
  484. package/lib/typescript/index.d.ts.map +0 -1
  485. package/lib/typescript/lm.d.ts +0 -36
  486. package/lib/typescript/lm.d.ts.map +0 -1
  487. package/lib/typescript/projectId.d.ts +0 -2
  488. package/lib/typescript/projectId.d.ts.map +0 -1
  489. package/lib/typescript/remote.d.ts +0 -8
  490. package/lib/typescript/remote.d.ts.map +0 -1
  491. package/lib/typescript/telemetry.d.ts +0 -25
  492. package/lib/typescript/telemetry.d.ts.map +0 -1
  493. package/lib/typescript/tools.d.ts +0 -36
  494. package/lib/typescript/tools.d.ts.map +0 -1
  495. package/lib/typescript/tts.d.ts +0 -54
  496. package/lib/typescript/tts.d.ts.map +0 -1
  497. package/lib/typescript/vlm.d.ts +0 -33
  498. package/lib/typescript/vlm.d.ts.map +0 -1
  499. package/scripts/postInstall.js +0 -33
  500. package/src/NativeCactus.ts +0 -317
  501. package/src/agent.ts +0 -112
  502. package/src/chat.ts +0 -91
  503. package/src/index.ts +0 -663
  504. package/src/lm.ts +0 -324
  505. package/src/projectId.ts +0 -1
  506. package/src/remote.ts +0 -113
  507. package/src/telemetry.ts +0 -137
  508. package/src/tools.ts +0 -94
  509. package/src/tts.ts +0 -236
  510. package/src/vlm.ts +0 -276
@@ -1,169 +0,0 @@
1
- #pragma once
2
-
3
- #include "llama.h"
4
-
5
- #include "llama-impl.h"
6
- #include "llama-arch.h"
7
- #include "llama-mmap.h"
8
-
9
- #include "ggml-cpp.h"
10
-
11
- #include <cstddef>
12
- #include <map>
13
- #include <stdexcept>
14
- #include <unordered_map>
15
-
16
- using llama_buf_map = std::unordered_map<uint32_t, lm_ggml_backend_buffer_t>;
17
-
18
- enum llama_fver {
19
- LM_GGUF_FILE_VERSION_V1 = 1,
20
- LM_GGUF_FILE_VERSION_V2 = 2,
21
- LM_GGUF_FILE_VERSION_V3 = 3,
22
- };
23
-
24
- const char * llama_file_version_name(llama_fver version);
25
-
26
- struct llama_model_loader {
27
- // Holds information on a model weight
28
- struct llama_tensor_weight {
29
- uint16_t idx; // source file index
30
- size_t offs; // tensor data offset in the original file
31
-
32
- lm_ggml_tensor * tensor;
33
-
34
- llama_tensor_weight(const llama_file * file, uint16_t idx, const struct lm_gguf_context * lm_gguf_ctx, lm_ggml_tensor * tensor) : idx(idx), tensor(tensor) {
35
- const int tensor_idx = lm_gguf_find_tensor(lm_gguf_ctx, lm_ggml_get_name(tensor));
36
- if (tensor_idx < 0) {
37
- throw std::runtime_error(format("tensor '%s' not found in the model", lm_ggml_get_name(tensor)));
38
- }
39
-
40
- offs = lm_gguf_get_data_offset(lm_gguf_ctx) + lm_gguf_get_tensor_offset(lm_gguf_ctx, tensor_idx);
41
- if (offs + lm_ggml_nbytes(tensor) < offs || offs + lm_ggml_nbytes(tensor) > file->size()) {
42
- throw std::runtime_error(format("tensor '%s' data is not within the file bounds, model is corrupted or incomplete", lm_ggml_get_name(tensor)));
43
- }
44
- }
45
- };
46
-
47
- // custom comparator to sort weights more nicely by layer
48
- struct weight_name_comparer {
49
- bool operator()(const std::string & a, const std::string & b) const {
50
- int a_layer = -1;
51
- int b_layer = -1;
52
- sscanf(a.c_str(), "blk.%d.", &a_layer);
53
- sscanf(b.c_str(), "blk.%d.", &b_layer);
54
- if (a_layer != b_layer) {
55
- return a_layer < b_layer;
56
- }
57
- return a < b;
58
- }
59
- };
60
-
61
- static const int TENSOR_NOT_REQUIRED = 1;
62
- static const int TENSOR_DUPLICATED = 2;
63
-
64
- int n_kv = 0;
65
- int n_tensors = 0;
66
- int n_created = 0;
67
-
68
- uint64_t n_elements = 0;
69
- size_t n_bytes = 0;
70
-
71
- bool use_mmap = false;
72
- bool check_tensors;
73
-
74
- llama_files files;
75
- llama_ftype ftype;
76
- llama_fver fver;
77
-
78
- llama_mmaps mappings;
79
-
80
- std::map<std::string, llama_tensor_weight, weight_name_comparer> weights_map;
81
- std::unordered_map<std::string, llama_model_kv_override> kv_overrides;
82
- const llama_model_tensor_buft_override * tensor_buft_overrides;
83
-
84
- lm_gguf_context_ptr meta;
85
- std::vector<lm_ggml_context_ptr> contexts;
86
-
87
- std::string arch_name;
88
- LLM_KV llm_kv = LLM_KV(LLM_ARCH_UNKNOWN);
89
-
90
- size_t size_done = 0;
91
- size_t size_data = 0;
92
- std::vector<std::pair<size_t, size_t>> mmaps_used;
93
-
94
- llama_model_loader(
95
- const std::string & fname,
96
- std::vector<std::string> & splits, // optional, only need if the split does not follow naming scheme
97
- bool use_mmap,
98
- bool check_tensors,
99
- const llama_model_kv_override * param_overrides_p,
100
- const llama_model_tensor_buft_override * param_tensor_buft_overrides_p);
101
-
102
- template<typename T>
103
- typename std::enable_if<std::is_integral<T>::value, bool>::type
104
- get_arr_n(const std::string & key, T & result, bool required = true);
105
-
106
- template<typename T>
107
- typename std::enable_if<std::is_integral<T>::value, bool>::type
108
- get_arr_n(enum llm_kv kid, T & result, bool required = true);
109
-
110
- template<typename T>
111
- bool get_arr(const std::string & key, std::vector<T> & result, bool required = true);
112
-
113
- template<typename T, size_t N_MAX>
114
- bool get_arr(const std::string & key, std::array<T, N_MAX> & result, bool required = true);
115
-
116
- template<typename T>
117
- bool get_arr(enum llm_kv kid, T & result, bool required = true);
118
-
119
- template<typename T>
120
- bool get_key(const std::string & key, T & result, bool required = true);
121
-
122
- template<typename T>
123
- bool get_key(enum llm_kv kid, T & result, bool required = true);
124
-
125
- template<typename T, size_t N_MAX>
126
- bool get_key_or_arr(const std::string & key, std::array<T, N_MAX> & result, uint32_t n, bool required = true);
127
-
128
- template<typename T>
129
- bool get_key_or_arr(enum llm_kv kid, T & result, uint32_t n, bool required = true);
130
-
131
- std::string get_arch_name() const;
132
-
133
- enum llm_arch get_arch() const;
134
-
135
- const llama_tensor_weight * get_weight(const char * name) const;
136
-
137
- const llama_tensor_weight & require_weight(const char * name) const;
138
-
139
- struct lm_ggml_tensor * get_tensor_meta(const char * name) const;
140
-
141
- struct lm_ggml_tensor * require_tensor_meta(const std::string & name) const;
142
-
143
- const struct lm_ggml_tensor * check_tensor_dims(const std::string & name, const std::vector<int64_t> & ne, bool required) const;
144
-
145
- struct lm_ggml_tensor * create_tensor(struct lm_ggml_context * ctx, const std::string & name, const std::initializer_list<int64_t> & ne, int flags = 0);
146
-
147
- struct lm_ggml_tensor * create_tensor_as_view(struct lm_ggml_context * ctx, struct lm_ggml_tensor * base, const std::string & name, const std::initializer_list<int64_t> & ne, size_t offset, bool required = true);
148
-
149
- void done_getting_tensors() const;
150
-
151
- void init_mappings(bool prefetch = true, llama_mlocks * mlock_mmaps = nullptr);
152
-
153
- void get_mapping_range(size_t * first, size_t * last, void ** addr, int idx, lm_ggml_context * ctx) const;
154
-
155
- // for backwards compatibility, does not support ggml-backend
156
- void load_data_for(struct lm_ggml_tensor * cur) const;
157
-
158
- // Returns false if cancelled by progress_callback
159
- bool load_all_data(
160
- struct lm_ggml_context * ctx,
161
- llama_buf_map & bufs,
162
- llama_mlocks * lmlocks,
163
- llama_progress_callback progress_callback,
164
- void * progress_callback_user_data);
165
-
166
- std::string ftype_name() const;
167
-
168
- void print_info() const;
169
- };
@@ -1,37 +0,0 @@
1
- #pragma once
2
-
3
- #include "llama.h"
4
- #include "llama-arch.h"
5
-
6
- #include <vector>
7
-
8
- struct llama_model_saver {
9
- struct lm_gguf_context * lm_gguf_ctx = nullptr;
10
- const struct llama_model & model;
11
- const struct LLM_KV llm_kv;
12
-
13
- llama_model_saver(const struct llama_model & model);
14
- ~llama_model_saver();
15
-
16
- void add_kv(enum llm_kv key, uint32_t value);
17
- void add_kv(enum llm_kv key, int32_t value);
18
- void add_kv(enum llm_kv key, float value);
19
- void add_kv(enum llm_kv key, bool value);
20
- void add_kv(enum llm_kv key, const char * value);
21
-
22
- [[noreturn]]
23
- void add_kv(enum llm_kv key, char value); // needed to make the template below compile
24
-
25
- template <typename Container>
26
- void add_kv(enum llm_kv key, const Container & value, bool per_layer = false);
27
-
28
- void add_kv(enum llm_kv key, const std::vector<std::string> & value);
29
-
30
- void add_tensor(const struct lm_ggml_tensor * tensor);
31
-
32
- void add_kv_from_model();
33
-
34
- void add_tensors_from_model();
35
-
36
- void save(const std::string & path_model);
37
- };
@@ -1,425 +0,0 @@
1
- #pragma once
2
-
3
- #include "llama.h"
4
- #include "llama-arch.h"
5
- #include "llama-graph.h"
6
- #include "llama-hparams.h"
7
- #include "llama-memory.h"
8
- #include "llama-vocab.h"
9
-
10
- #include <memory>
11
- #include <string>
12
- #include <unordered_map>
13
- #include <vector>
14
-
15
- struct llama_cparams;
16
- struct llama_ubatch;
17
- struct llama_model_loader;
18
-
19
- // available models
20
- enum llm_type {
21
- LLM_TYPE_UNKNOWN,
22
- LLM_TYPE_14M,
23
- LLM_TYPE_17M,
24
- LLM_TYPE_22M,
25
- LLM_TYPE_33M,
26
- LLM_TYPE_60M,
27
- LLM_TYPE_70M,
28
- LLM_TYPE_80M,
29
- LLM_TYPE_109M,
30
- LLM_TYPE_137M,
31
- LLM_TYPE_160M,
32
- LLM_TYPE_190M,
33
- LLM_TYPE_220M,
34
- LLM_TYPE_250M,
35
- LLM_TYPE_270M,
36
- LLM_TYPE_335M,
37
- LLM_TYPE_410M,
38
- LLM_TYPE_450M,
39
- LLM_TYPE_475M,
40
- LLM_TYPE_770M,
41
- LLM_TYPE_780M,
42
- LLM_TYPE_0_5B,
43
- LLM_TYPE_0_6B,
44
- LLM_TYPE_1B,
45
- LLM_TYPE_1_3B,
46
- LLM_TYPE_1_4B,
47
- LLM_TYPE_1_5B,
48
- LLM_TYPE_1_6B,
49
- LLM_TYPE_1_7B,
50
- LLM_TYPE_1_8B,
51
- LLM_TYPE_2B,
52
- LLM_TYPE_2_8B,
53
- LLM_TYPE_2_9B,
54
- LLM_TYPE_3B,
55
- LLM_TYPE_4B,
56
- LLM_TYPE_6B,
57
- LLM_TYPE_6_9B,
58
- LLM_TYPE_7B,
59
- LLM_TYPE_8B,
60
- LLM_TYPE_9B,
61
- LLM_TYPE_11B,
62
- LLM_TYPE_12B,
63
- LLM_TYPE_13B,
64
- LLM_TYPE_14B,
65
- LLM_TYPE_15B,
66
- LLM_TYPE_16B,
67
- LLM_TYPE_20B,
68
- LLM_TYPE_27B,
69
- LLM_TYPE_30B,
70
- LLM_TYPE_32B,
71
- LLM_TYPE_34B,
72
- LLM_TYPE_35B,
73
- LLM_TYPE_40B,
74
- LLM_TYPE_65B,
75
- LLM_TYPE_70B,
76
- LLM_TYPE_236B,
77
- LLM_TYPE_290B,
78
- LLM_TYPE_314B,
79
- LLM_TYPE_405B,
80
- LLM_TYPE_671B,
81
- LLM_TYPE_SMALL,
82
- LLM_TYPE_MEDIUM,
83
- LLM_TYPE_LARGE,
84
- LLM_TYPE_XL,
85
- LLM_TYPE_A1_7B,
86
- LLM_TYPE_A2_7B,
87
- LLM_TYPE_8x7B,
88
- LLM_TYPE_8x22B,
89
- LLM_TYPE_16x12B,
90
- LLM_TYPE_16x3_8B,
91
- LLM_TYPE_10B_128x3_66B,
92
- LLM_TYPE_57B_A14B,
93
- LLM_TYPE_17B_16E, // llama4 Scout
94
- LLM_TYPE_17B_128E, // llama4 Maverick
95
- LLM_TYPE_30B_A3B,
96
- LLM_TYPE_235B_A22B,
97
- };
98
-
99
- std::string llama_rope_scaling_type_name(llama_rope_scaling_type rope_scaling_type);
100
-
101
- struct llama_layer_posnet {
102
- // resnet
103
- struct lm_ggml_tensor * norm1 = nullptr;
104
- struct lm_ggml_tensor * norm1_b = nullptr;
105
-
106
- struct lm_ggml_tensor * conv1 = nullptr;
107
- struct lm_ggml_tensor * conv1_b = nullptr;
108
-
109
- struct lm_ggml_tensor * norm2 = nullptr;
110
- struct lm_ggml_tensor * norm2_b = nullptr;
111
-
112
- struct lm_ggml_tensor * conv2 = nullptr;
113
- struct lm_ggml_tensor * conv2_b = nullptr;
114
-
115
- // attention
116
- struct lm_ggml_tensor * attn_norm = nullptr;
117
- struct lm_ggml_tensor * attn_norm_b = nullptr;
118
-
119
- struct lm_ggml_tensor * attn_q = nullptr;
120
- struct lm_ggml_tensor * attn_q_b = nullptr;
121
-
122
- struct lm_ggml_tensor * attn_k = nullptr;
123
- struct lm_ggml_tensor * attn_k_b = nullptr;
124
-
125
- struct lm_ggml_tensor * attn_v = nullptr;
126
- struct lm_ggml_tensor * attn_v_b = nullptr;
127
-
128
- struct lm_ggml_tensor * attn_o = nullptr;
129
- struct lm_ggml_tensor * attn_o_b = nullptr;
130
-
131
- // normalize
132
- struct lm_ggml_tensor * norm = nullptr;
133
- struct lm_ggml_tensor * norm_b = nullptr;
134
- };
135
-
136
- struct llama_layer_convnext {
137
- struct lm_ggml_tensor * dw = nullptr;
138
- struct lm_ggml_tensor * dw_b = nullptr;
139
-
140
- struct lm_ggml_tensor * norm = nullptr;
141
- struct lm_ggml_tensor * norm_b = nullptr;
142
-
143
- struct lm_ggml_tensor * pw1 = nullptr;
144
- struct lm_ggml_tensor * pw1_b = nullptr;
145
-
146
- struct lm_ggml_tensor * pw2 = nullptr;
147
- struct lm_ggml_tensor * pw2_b = nullptr;
148
-
149
- struct lm_ggml_tensor * gamma = nullptr;
150
- };
151
-
152
- struct llama_layer {
153
- // normalization
154
- struct lm_ggml_tensor * attn_norm = nullptr;
155
- struct lm_ggml_tensor * attn_norm_b = nullptr;
156
- struct lm_ggml_tensor * attn_norm_2 = nullptr;
157
- struct lm_ggml_tensor * attn_norm_2_b = nullptr;
158
- struct lm_ggml_tensor * attn_q_norm = nullptr;
159
- struct lm_ggml_tensor * attn_q_norm_b = nullptr;
160
- struct lm_ggml_tensor * attn_k_norm = nullptr;
161
- struct lm_ggml_tensor * attn_k_norm_b = nullptr;
162
- struct lm_ggml_tensor * attn_out_norm = nullptr;
163
- struct lm_ggml_tensor * attn_out_norm_b = nullptr;
164
- struct lm_ggml_tensor * attn_q_a_norm = nullptr;
165
- struct lm_ggml_tensor * attn_kv_a_norm = nullptr;
166
- struct lm_ggml_tensor * attn_sub_norm = nullptr;
167
- struct lm_ggml_tensor * attn_post_norm = nullptr;
168
- struct lm_ggml_tensor * ffn_sub_norm = nullptr;
169
- struct lm_ggml_tensor * attn_norm_cross = nullptr;
170
- struct lm_ggml_tensor * attn_norm_enc = nullptr;
171
-
172
- // attention
173
- struct lm_ggml_tensor * wq = nullptr;
174
- struct lm_ggml_tensor * wk = nullptr;
175
- struct lm_ggml_tensor * wv = nullptr;
176
- struct lm_ggml_tensor * wo = nullptr;
177
- struct lm_ggml_tensor * wqkv = nullptr;
178
- struct lm_ggml_tensor * wq_a = nullptr;
179
- struct lm_ggml_tensor * wq_b = nullptr;
180
- struct lm_ggml_tensor * wkv_a_mqa = nullptr;
181
- struct lm_ggml_tensor * wkv_b = nullptr;
182
- struct lm_ggml_tensor * wk_b = nullptr;
183
- struct lm_ggml_tensor * wv_b = nullptr;
184
- struct lm_ggml_tensor * wq_cross = nullptr;
185
- struct lm_ggml_tensor * wk_cross = nullptr;
186
- struct lm_ggml_tensor * wv_cross = nullptr;
187
- struct lm_ggml_tensor * wo_cross = nullptr;
188
- struct lm_ggml_tensor * wq_enc = nullptr;
189
- struct lm_ggml_tensor * wk_enc = nullptr;
190
- struct lm_ggml_tensor * wv_enc = nullptr;
191
- struct lm_ggml_tensor * wo_enc = nullptr;
192
-
193
- // attention bias
194
- struct lm_ggml_tensor * bq = nullptr;
195
- struct lm_ggml_tensor * bk = nullptr;
196
- struct lm_ggml_tensor * bv = nullptr;
197
- struct lm_ggml_tensor * bo = nullptr;
198
- struct lm_ggml_tensor * bqkv = nullptr;
199
-
200
- // relative position bias
201
- struct lm_ggml_tensor * attn_rel_b = nullptr;
202
- struct lm_ggml_tensor * attn_rel_b_enc = nullptr;
203
- struct lm_ggml_tensor * attn_rel_b_cross = nullptr;
204
-
205
- // normalization
206
- struct lm_ggml_tensor * ffn_norm = nullptr;
207
- struct lm_ggml_tensor * ffn_norm_b = nullptr;
208
- struct lm_ggml_tensor * ffn_post_norm = nullptr;
209
- struct lm_ggml_tensor * layer_out_norm = nullptr;
210
- struct lm_ggml_tensor * layer_out_norm_b = nullptr;
211
- struct lm_ggml_tensor * ffn_norm_exps = nullptr;
212
- struct lm_ggml_tensor * ffn_norm_enc = nullptr;
213
-
214
- // ff
215
- struct lm_ggml_tensor * ffn_gate = nullptr; // w1
216
- struct lm_ggml_tensor * ffn_down = nullptr; // w2
217
- struct lm_ggml_tensor * ffn_up = nullptr; // w3
218
- struct lm_ggml_tensor * ffn_gate_enc = nullptr;
219
- struct lm_ggml_tensor * ffn_down_enc = nullptr;
220
- struct lm_ggml_tensor * ffn_up_enc = nullptr;
221
-
222
- // ff MoE
223
- struct lm_ggml_tensor * ffn_gate_inp = nullptr;
224
- struct lm_ggml_tensor * ffn_gate_exps = nullptr;
225
- struct lm_ggml_tensor * ffn_down_exps = nullptr;
226
- struct lm_ggml_tensor * ffn_up_exps = nullptr;
227
-
228
- // ff shared expert (shexp)
229
- struct lm_ggml_tensor * ffn_gate_inp_shexp = nullptr;
230
- struct lm_ggml_tensor * ffn_gate_shexp = nullptr;
231
- struct lm_ggml_tensor * ffn_down_shexp = nullptr;
232
- struct lm_ggml_tensor * ffn_up_shexp = nullptr;
233
-
234
- // ff bias
235
- struct lm_ggml_tensor * ffn_gate_b = nullptr;
236
- struct lm_ggml_tensor * ffn_down_b = nullptr; // b2
237
- struct lm_ggml_tensor * ffn_up_b = nullptr; // b3
238
- struct lm_ggml_tensor * ffn_act = nullptr;
239
- struct lm_ggml_tensor * ffn_exp_probs_b = nullptr;
240
-
241
- // mamba proj
242
- struct lm_ggml_tensor * ssm_in = nullptr;
243
- struct lm_ggml_tensor * ssm_x = nullptr;
244
- struct lm_ggml_tensor * ssm_dt = nullptr;
245
- struct lm_ggml_tensor * ssm_out = nullptr;
246
-
247
- // mamba
248
- struct lm_ggml_tensor * ssm_conv1d = nullptr;
249
- struct lm_ggml_tensor * ssm_a = nullptr;
250
- struct lm_ggml_tensor * ssm_d = nullptr;
251
-
252
- // mamba bias
253
- struct lm_ggml_tensor * ssm_conv1d_b = nullptr;
254
- struct lm_ggml_tensor * ssm_dt_b = nullptr;
255
-
256
- // rwkv
257
- struct lm_ggml_tensor * time_mix_w1 = nullptr;
258
- struct lm_ggml_tensor * time_mix_w2 = nullptr;
259
- struct lm_ggml_tensor * time_mix_lerp_x = nullptr;
260
- struct lm_ggml_tensor * time_mix_lerp_w = nullptr;
261
- struct lm_ggml_tensor * time_mix_lerp_k = nullptr;
262
- struct lm_ggml_tensor * time_mix_lerp_v = nullptr;
263
- struct lm_ggml_tensor * time_mix_lerp_r = nullptr;
264
- struct lm_ggml_tensor * time_mix_lerp_g = nullptr;
265
- struct lm_ggml_tensor * time_mix_lerp_fused = nullptr;
266
-
267
- struct lm_ggml_tensor * time_mix_first = nullptr;
268
- struct lm_ggml_tensor * time_mix_decay = nullptr;
269
- struct lm_ggml_tensor * time_mix_decay_w1 = nullptr;
270
- struct lm_ggml_tensor * time_mix_decay_w2 = nullptr;
271
- struct lm_ggml_tensor * time_mix_key = nullptr;
272
- struct lm_ggml_tensor * time_mix_key_b = nullptr;
273
- struct lm_ggml_tensor * time_mix_value = nullptr;
274
- struct lm_ggml_tensor * time_mix_value_b = nullptr;
275
- struct lm_ggml_tensor * time_mix_receptance = nullptr;
276
- struct lm_ggml_tensor * time_mix_receptance_b = nullptr;
277
- struct lm_ggml_tensor * time_mix_gate = nullptr;
278
-
279
- // rwkv7
280
- struct lm_ggml_tensor * time_mix_w0 = nullptr;
281
- struct lm_ggml_tensor * time_mix_a0 = nullptr;
282
- struct lm_ggml_tensor * time_mix_a1 = nullptr;
283
- struct lm_ggml_tensor * time_mix_a2 = nullptr;
284
- struct lm_ggml_tensor * time_mix_v0 = nullptr;
285
- struct lm_ggml_tensor * time_mix_v1 = nullptr;
286
- struct lm_ggml_tensor * time_mix_v2 = nullptr;
287
- struct lm_ggml_tensor * time_mix_g1 = nullptr;
288
- struct lm_ggml_tensor * time_mix_g2 = nullptr;
289
- struct lm_ggml_tensor * time_mix_k_k = nullptr;
290
- struct lm_ggml_tensor * time_mix_k_a = nullptr;
291
- struct lm_ggml_tensor * time_mix_r_k = nullptr;
292
-
293
- struct lm_ggml_tensor * time_mix_ln = nullptr;
294
- struct lm_ggml_tensor * time_mix_ln_b = nullptr;
295
- struct lm_ggml_tensor * time_mix_output = nullptr;
296
-
297
- struct lm_ggml_tensor * channel_mix_lerp_k = nullptr;
298
- struct lm_ggml_tensor * channel_mix_lerp_r = nullptr;
299
-
300
- struct lm_ggml_tensor * channel_mix_key = nullptr;
301
- struct lm_ggml_tensor * channel_mix_receptance = nullptr;
302
- struct lm_ggml_tensor * channel_mix_value = nullptr;
303
-
304
- // long rope factors
305
- struct lm_ggml_tensor * rope_long = nullptr;
306
- struct lm_ggml_tensor * rope_short = nullptr;
307
- struct lm_ggml_tensor * rope_freqs = nullptr;
308
-
309
- // bitnet scale
310
- struct lm_ggml_tensor * wq_scale = nullptr;
311
- struct lm_ggml_tensor * wk_scale = nullptr;
312
- struct lm_ggml_tensor * wv_scale = nullptr;
313
- struct lm_ggml_tensor * wo_scale = nullptr;
314
- struct lm_ggml_tensor * ffn_gate_scale = nullptr;
315
- struct lm_ggml_tensor * ffn_up_scale = nullptr;
316
- struct lm_ggml_tensor * ffn_down_scale = nullptr;
317
-
318
- struct llama_layer_posnet posnet;
319
-
320
- struct llama_layer_convnext convnext;
321
- };
322
-
323
- struct llama_model {
324
- llm_type type = LLM_TYPE_UNKNOWN;
325
- llm_arch arch = LLM_ARCH_UNKNOWN;
326
-
327
- std::string name = "n/a";
328
-
329
- llama_hparams hparams = {};
330
- llama_vocab vocab;
331
-
332
- struct lm_ggml_tensor * tok_embd = nullptr;
333
- struct lm_ggml_tensor * type_embd = nullptr;
334
- struct lm_ggml_tensor * pos_embd = nullptr;
335
- struct lm_ggml_tensor * tok_norm = nullptr;
336
- struct lm_ggml_tensor * tok_norm_b = nullptr;
337
-
338
- struct lm_ggml_tensor * output_norm = nullptr;
339
- struct lm_ggml_tensor * output_norm_b = nullptr;
340
- struct lm_ggml_tensor * output = nullptr;
341
- struct lm_ggml_tensor * output_b = nullptr;
342
- struct lm_ggml_tensor * output_norm_enc = nullptr;
343
-
344
- // classifier
345
- struct lm_ggml_tensor * cls = nullptr;
346
- struct lm_ggml_tensor * cls_b = nullptr;
347
- struct lm_ggml_tensor * cls_out = nullptr;
348
- struct lm_ggml_tensor * cls_out_b = nullptr;
349
-
350
- struct lm_ggml_tensor * conv1d = nullptr;
351
- struct lm_ggml_tensor * conv1d_b = nullptr;
352
-
353
- std::vector<llama_layer> layers;
354
-
355
- llama_model_params params;
356
-
357
- // gguf metadata
358
- std::unordered_map<std::string, std::string> lm_gguf_kv;
359
-
360
- // list of devices used in this model
361
- std::vector<lm_ggml_backend_dev_t> devices;
362
-
363
- // for quantize-stats only
364
- std::vector<std::pair<std::string, struct lm_ggml_tensor *>> tensors_by_name;
365
-
366
- int64_t t_load_us = 0;
367
- int64_t t_start_us = 0;
368
-
369
- explicit llama_model(const struct llama_model_params & params);
370
- ~llama_model();
371
-
372
- void load_stats (llama_model_loader & ml);
373
- void load_arch (llama_model_loader & ml);
374
- void load_hparams(llama_model_loader & ml);
375
- void load_vocab (llama_model_loader & ml);
376
- bool load_tensors(llama_model_loader & ml); // returns false if cancelled by progress_callback
377
-
378
- std::string arch_name() const;
379
- std::string type_name() const;
380
-
381
- std::string desc() const;
382
-
383
- size_t size() const;
384
- size_t n_tensors() const;
385
- size_t n_devices() const;
386
-
387
- // total number of parameters in the model
388
- uint64_t n_elements() const;
389
-
390
- void print_info() const;
391
-
392
- lm_ggml_backend_dev_t dev_layer(int il) const;
393
- lm_ggml_backend_dev_t dev_output() const;
394
-
395
- lm_ggml_backend_buffer_type_t select_buft(int il) const;
396
-
397
- bool has_tensor_overrides() const;
398
-
399
- const struct lm_ggml_tensor * get_tensor(const char * name) const;
400
-
401
- float get_rope_freq_base (const llama_cparams & cparams, int il) const;
402
- float get_rope_freq_scale(const llama_cparams & cparams, int il) const;
403
-
404
- lm_ggml_tensor * get_rope_factors(const llama_cparams & cparams, int il) const;
405
-
406
- // note: can mutate `cparams`
407
- // TODO: move this to new llm_arch_model_i interface
408
- llama_memory_i * create_memory(const llama_memory_params & params, llama_cparams & cparams) const;
409
-
410
- // TODO: move this to new llm_arch_model_i interface
411
- llm_graph_result_ptr build_graph(
412
- const llm_graph_params & params,
413
- lm_ggml_cgraph * gf,
414
- llm_graph_type type) const;
415
-
416
- private:
417
- struct impl;
418
- std::unique_ptr<impl> pimpl;
419
- };
420
-
421
- const char * llm_type_name(llm_type type);
422
-
423
- // For internal test use
424
- // TODO: remove
425
- const std::vector<std::pair<std::string, lm_ggml_tensor *>> & llama_internal_get_tensor_map(const llama_model * model);
@@ -1,32 +0,0 @@
1
- #pragma once
2
-
3
- // TODO: rename llama-sampling.h/.cpp to llama-sampler.h/.cpp ?
4
-
5
- #include "llama.h"
6
-
7
- #include <vector>
8
-
9
- struct llama_vocab;
10
- struct llama_grammar;
11
-
12
- // sampler chain
13
-
14
- struct llama_sampler_chain {
15
- llama_sampler_chain_params params;
16
-
17
- std::vector<struct llama_sampler *> samplers;
18
-
19
- // timing
20
-
21
- mutable int64_t t_sample_us;
22
-
23
- mutable int32_t n_sample;
24
- };
25
-
26
- struct llama_sampler * llama_sampler_init_dry_testing(
27
- int32_t context_size,
28
- float dry_multiplier,
29
- float dry_base,
30
- int32_t dry_allowed_length,
31
- int32_t dry_penalty_last_n,
32
- const std::vector<std::vector<llama_token>>& seq_breakers);