cactus-react-native 0.2.11 → 1.0.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/Cactus.podspec +34 -0
- package/LICENSE +38 -0
- package/README.md +550 -69
- package/android/CMakeLists.txt +40 -0
- package/android/build.gradle +68 -44
- package/android/gradle.properties +5 -5
- package/android/src/main/AndroidManifest.xml +1 -3
- package/android/src/main/cpp/cpp-adapter.cpp +6 -0
- package/android/src/main/java/com/margelo/nitro/cactus/CactusPackage.kt +22 -0
- package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusCrypto.kt +38 -0
- package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusDeviceInfo.kt +24 -0
- package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusFileSystem.kt +227 -0
- package/android/src/main/jniLibs/arm64-v8a/{libcactus_v8.so → libcactus.a} +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_util.so +0 -0
- package/cpp/HybridCactus.cpp +135 -0
- package/cpp/HybridCactus.hpp +42 -0
- package/cpp/HybridCactusUtil.cpp +47 -0
- package/cpp/HybridCactusUtil.hpp +26 -0
- package/cpp/cactus_ffi.h +55 -0
- package/cpp/cactus_util.h +25 -0
- package/ios/HybridCactusCrypto.swift +37 -0
- package/ios/HybridCactusDeviceInfo.swift +32 -0
- package/ios/HybridCactusFileSystem.swift +234 -0
- package/ios/cactus.xcframework/{info.plist → Info.plist} +2 -37
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus.h +8 -229
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus_ffi.h +28 -229
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/engine.h +545 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ffi_utils.h +400 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/graph.h +338 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/kernel.h +275 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/kernel_utils.h +343 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/cactus +0 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus.h +11 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus_ffi.h +55 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/engine.h +545 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/ffi_utils.h +400 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/graph.h +338 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/kernel.h +275 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/kernel_utils.h +343 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/{tvos-arm64_x86_64-simulator → ios-arm64-simulator}/cactus.framework/_CodeSignature/CodeResources +1 -1
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/cactus +0 -0
- package/ios/cactus_util.xcframework/Info.plist +39 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/cactus_util.h +25 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/ios_utils.h +10 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/logging.h +25 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Info.plist +0 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/cactus_util +0 -0
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/cactus_util.h +25 -0
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/ios_utils.h +10 -0
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/logging.h +25 -0
- package/ios/{cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework → cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework}/Info.plist +0 -0
- package/ios/{cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework → cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework}/_CodeSignature/CodeResources +36 -2
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/cactus_util +0 -0
- package/lib/module/api/Database.js +60 -0
- package/lib/module/api/Database.js.map +1 -0
- package/lib/module/classes/CactusLM.js +151 -0
- package/lib/module/classes/CactusLM.js.map +1 -0
- package/lib/module/config/CactusConfig.js +6 -0
- package/lib/module/config/CactusConfig.js.map +1 -0
- package/lib/module/constants/packageVersion.js +4 -0
- package/lib/module/constants/packageVersion.js.map +1 -0
- package/lib/module/hooks/useCactusLM.js +238 -0
- package/lib/module/hooks/useCactusLM.js.map +1 -0
- package/lib/module/index.js +9 -409
- package/lib/module/index.js.map +1 -1
- package/lib/module/native/Cactus.js +50 -0
- package/lib/module/native/Cactus.js.map +1 -0
- package/lib/module/native/CactusCrypto.js +10 -0
- package/lib/module/native/CactusCrypto.js.map +1 -0
- package/lib/module/native/CactusDeviceInfo.js +13 -0
- package/lib/module/native/CactusDeviceInfo.js.map +1 -0
- package/lib/module/native/CactusFileSystem.js +35 -0
- package/lib/module/native/CactusFileSystem.js.map +1 -0
- package/lib/module/native/CactusUtil.js +23 -0
- package/lib/module/native/CactusUtil.js.map +1 -0
- package/lib/module/native/index.js +8 -0
- package/lib/module/native/index.js.map +1 -0
- package/lib/module/specs/Cactus.nitro.js +4 -0
- package/lib/module/specs/Cactus.nitro.js.map +1 -0
- package/lib/module/specs/CactusCrypto.nitro.js +4 -0
- package/lib/module/specs/CactusCrypto.nitro.js.map +1 -0
- package/lib/module/specs/CactusDeviceInfo.nitro.js +4 -0
- package/lib/module/specs/CactusDeviceInfo.nitro.js.map +1 -0
- package/lib/module/specs/CactusFileSystem.nitro.js +4 -0
- package/lib/module/specs/CactusFileSystem.nitro.js.map +1 -0
- package/lib/module/specs/CactusUtil.nitro.js +4 -0
- package/lib/module/specs/CactusUtil.nitro.js.map +1 -0
- package/lib/module/telemetry/Telemetry.js +100 -0
- package/lib/module/telemetry/Telemetry.js.map +1 -0
- package/lib/module/types/CactusLM.js +2 -0
- package/lib/module/types/CactusLM.js.map +1 -0
- package/lib/module/types/CactusModel.js +2 -0
- package/lib/module/types/CactusModel.js.map +1 -0
- package/lib/module/utils/error.js +4 -0
- package/lib/module/utils/error.js.map +1 -0
- package/lib/typescript/package.json +1 -0
- package/lib/typescript/src/api/Database.d.ts +11 -0
- package/lib/typescript/src/api/Database.d.ts.map +1 -0
- package/lib/typescript/src/classes/CactusLM.d.ts +26 -0
- package/lib/typescript/src/classes/CactusLM.d.ts.map +1 -0
- package/lib/typescript/src/config/CactusConfig.d.ts +5 -0
- package/lib/typescript/src/config/CactusConfig.d.ts.map +1 -0
- package/lib/typescript/src/constants/packageVersion.d.ts +2 -0
- package/lib/typescript/src/constants/packageVersion.d.ts.map +1 -0
- package/lib/typescript/src/hooks/useCactusLM.d.ts +20 -0
- package/lib/typescript/src/hooks/useCactusLM.d.ts.map +1 -0
- package/lib/typescript/src/index.d.ts +6 -0
- package/lib/typescript/src/index.d.ts.map +1 -0
- package/lib/typescript/src/native/Cactus.d.ts +11 -0
- package/lib/typescript/src/native/Cactus.d.ts.map +1 -0
- package/lib/typescript/src/native/CactusCrypto.d.ts +5 -0
- package/lib/typescript/src/native/CactusCrypto.d.ts.map +1 -0
- package/lib/typescript/src/native/CactusDeviceInfo.d.ts +7 -0
- package/lib/typescript/src/native/CactusDeviceInfo.d.ts.map +1 -0
- package/lib/typescript/src/native/CactusFileSystem.d.ts +13 -0
- package/lib/typescript/src/native/CactusFileSystem.d.ts.map +1 -0
- package/lib/typescript/src/native/CactusUtil.d.ts +6 -0
- package/lib/typescript/src/native/CactusUtil.d.ts.map +1 -0
- package/lib/typescript/src/native/index.d.ts +6 -0
- package/lib/typescript/src/native/index.d.ts.map +1 -0
- package/lib/typescript/src/specs/Cactus.nitro.d.ts +13 -0
- package/lib/typescript/src/specs/Cactus.nitro.d.ts.map +1 -0
- package/lib/typescript/src/specs/CactusCrypto.nitro.d.ts +8 -0
- package/lib/typescript/src/specs/CactusCrypto.nitro.d.ts.map +1 -0
- package/lib/typescript/src/specs/CactusDeviceInfo.nitro.d.ts +16 -0
- package/lib/typescript/src/specs/CactusDeviceInfo.nitro.d.ts.map +1 -0
- package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts +16 -0
- package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts.map +1 -0
- package/lib/typescript/src/specs/CactusUtil.nitro.d.ts +10 -0
- package/lib/typescript/src/specs/CactusUtil.nitro.d.ts.map +1 -0
- package/lib/typescript/src/telemetry/Telemetry.d.ts +30 -0
- package/lib/typescript/src/telemetry/Telemetry.d.ts.map +1 -0
- package/lib/typescript/src/types/CactusLM.d.ts +67 -0
- package/lib/typescript/src/types/CactusLM.d.ts.map +1 -0
- package/lib/typescript/src/types/CactusModel.d.ts +12 -0
- package/lib/typescript/src/types/CactusModel.d.ts.map +1 -0
- package/lib/typescript/src/utils/error.d.ts +2 -0
- package/lib/typescript/src/utils/error.d.ts.map +1 -0
- package/nitro.json +31 -0
- package/nitrogen/generated/android/c++/JDeviceInfo.hpp +74 -0
- package/nitrogen/generated/android/c++/JFunc_void_double.hpp +74 -0
- package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.cpp +65 -0
- package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.hpp +65 -0
- package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.cpp +85 -0
- package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.hpp +66 -0
- package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.cpp +192 -0
- package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.hpp +73 -0
- package/nitrogen/generated/android/cactus+autolinking.cmake +87 -0
- package/nitrogen/generated/android/cactus+autolinking.gradle +27 -0
- package/nitrogen/generated/android/cactusOnLoad.cpp +86 -0
- package/nitrogen/generated/android/cactusOnLoad.hpp +25 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/DeviceInfo.kt +50 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/Func_void_double.kt +80 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusCryptoSpec.kt +58 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusDeviceInfoSpec.kt +62 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusFileSystemSpec.kt +95 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/cactusOnLoad.kt +35 -0
- package/nitrogen/generated/ios/Cactus+autolinking.rb +60 -0
- package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.cpp +122 -0
- package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.hpp +373 -0
- package/nitrogen/generated/ios/Cactus-Swift-Cxx-Umbrella.hpp +60 -0
- package/nitrogen/generated/ios/CactusAutolinking.mm +69 -0
- package/nitrogen/generated/ios/CactusAutolinking.swift +55 -0
- package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.cpp +11 -0
- package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.hpp +77 -0
- package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.cpp +11 -0
- package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.hpp +88 -0
- package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.cpp +11 -0
- package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.hpp +143 -0
- package/nitrogen/generated/ios/swift/DeviceInfo.swift +98 -0
- package/nitrogen/generated/ios/swift/Func_void.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_DeviceInfo.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_bool.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_double.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_std__exception_ptr.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_std__optional_std__string_.swift +54 -0
- package/nitrogen/generated/ios/swift/Func_void_std__string.swift +47 -0
- package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec.swift +57 -0
- package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec_cxx.swift +139 -0
- package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec.swift +58 -0
- package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec_cxx.swift +164 -0
- package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec.swift +65 -0
- package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec_cxx.swift +303 -0
- package/nitrogen/generated/shared/c++/DeviceInfo.hpp +92 -0
- package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.cpp +21 -0
- package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.hpp +63 -0
- package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.cpp +22 -0
- package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.hpp +67 -0
- package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.cpp +29 -0
- package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.hpp +73 -0
- package/nitrogen/generated/shared/c++/HybridCactusSpec.cpp +26 -0
- package/nitrogen/generated/shared/c++/HybridCactusSpec.hpp +71 -0
- package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.cpp +23 -0
- package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.hpp +66 -0
- package/package.json +84 -143
- package/src/api/Database.ts +83 -0
- package/src/classes/CactusLM.ts +205 -0
- package/src/config/CactusConfig.ts +4 -0
- package/src/constants/packageVersion.ts +1 -0
- package/src/hooks/useCactusLM.ts +285 -0
- package/src/index.tsx +23 -0
- package/src/native/Cactus.ts +83 -0
- package/src/native/CactusCrypto.ts +11 -0
- package/src/native/CactusDeviceInfo.ts +18 -0
- package/src/native/CactusFileSystem.ts +47 -0
- package/src/native/CactusUtil.ts +27 -0
- package/src/native/index.ts +5 -0
- package/src/specs/Cactus.nitro.ts +20 -0
- package/src/specs/CactusCrypto.nitro.ts +6 -0
- package/src/specs/CactusDeviceInfo.nitro.ts +15 -0
- package/src/specs/CactusFileSystem.nitro.ts +21 -0
- package/src/specs/CactusUtil.nitro.ts +8 -0
- package/src/telemetry/Telemetry.ts +159 -0
- package/src/types/CactusLM.ts +73 -0
- package/src/types/CactusModel.ts +14 -0
- package/src/utils/error.ts +2 -0
- package/LICENSE.txt +0 -20
- package/android/src/main/CMakeLists.txt +0 -140
- package/android/src/main/java/com/cactus/Cactus.java +0 -1190
- package/android/src/main/java/com/cactus/CactusPackage.java +0 -48
- package/android/src/main/java/com/cactus/LlamaContext.java +0 -748
- package/android/src/main/jni-utils.h +0 -100
- package/android/src/main/jni.cpp +0 -1605
- package/android/src/main/jniLibs/arm64-v8a/libcactus.so +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2.so +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_dotprod.so +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_dotprod_i8mm.so +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_i8mm.so +0 -0
- package/android/src/newarch/java/com/cactus/CactusModule.java +0 -204
- package/android/src/oldarch/java/com/cactus/CactusModule.java +0 -205
- package/cactus-react-native.podspec +0 -42
- package/ios/CMakeLists.txt +0 -131
- package/ios/Cactus.h +0 -6
- package/ios/Cactus.mm +0 -681
- package/ios/CactusContext.h +0 -81
- package/ios/CactusContext.mm +0 -1032
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/chat.h +0 -145
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/common.h +0 -674
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-alloc.h +0 -76
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-backend-impl.h +0 -255
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-backend.h +0 -354
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-common.h +0 -1857
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-cpp.h +0 -39
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-cpu.h +0 -143
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-impl.h +0 -601
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-metal-impl.h +0 -622
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-metal.h +0 -66
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-opt.h +0 -237
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-quants.h +0 -100
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-threading.h +0 -14
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml.h +0 -2202
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/gguf.h +0 -202
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/json.hpp +0 -24766
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-adapter.h +0 -76
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-arch.h +0 -437
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-batch.h +0 -89
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-chat.h +0 -58
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-context.h +0 -276
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-cparams.h +0 -39
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-cpp.h +0 -30
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-grammar.h +0 -173
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-graph.h +0 -640
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-hparams.h +0 -190
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-impl.h +0 -61
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-io.h +0 -35
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-kv-cache.h +0 -515
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-memory.h +0 -32
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-mmap.h +0 -68
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model-loader.h +0 -169
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model-saver.h +0 -37
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model.h +0 -425
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-sampling.h +0 -32
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-vocab.h +0 -131
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama.h +0 -1376
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/log.h +0 -103
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/minja/chat-template.hpp +0 -542
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/minja/minja.hpp +0 -2974
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/sampling.h +0 -107
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/unicode-data.h +0 -20
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/unicode.h +0 -66
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/ggml-llama.metallib +0 -0
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/cactus.h +0 -232
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/cactus_ffi.h +0 -256
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/chat.h +0 -145
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/common.h +0 -674
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-alloc.h +0 -76
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend-impl.h +0 -255
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend.h +0 -354
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-common.h +0 -1857
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpp.h +0 -39
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpu.h +0 -143
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-impl.h +0 -601
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal-impl.h +0 -622
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal.h +0 -66
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-opt.h +0 -237
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-quants.h +0 -100
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-threading.h +0 -14
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml.h +0 -2202
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/gguf.h +0 -202
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/json.hpp +0 -24766
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-adapter.h +0 -76
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-arch.h +0 -437
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-batch.h +0 -89
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-chat.h +0 -58
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-context.h +0 -276
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-cparams.h +0 -39
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-cpp.h +0 -30
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-grammar.h +0 -173
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-graph.h +0 -640
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-hparams.h +0 -190
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-impl.h +0 -61
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-io.h +0 -35
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-kv-cache.h +0 -515
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-memory.h +0 -32
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-mmap.h +0 -68
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-loader.h +0 -169
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-saver.h +0 -37
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model.h +0 -425
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-sampling.h +0 -32
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-vocab.h +0 -131
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama.h +0 -1376
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/log.h +0 -103
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/minja/chat-template.hpp +0 -542
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/minja/minja.hpp +0 -2974
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/sampling.h +0 -107
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/unicode-data.h +0 -20
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/unicode.h +0 -66
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/cactus +0 -0
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/ggml-llama-sim.metallib +0 -0
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/cactus.h +0 -232
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/cactus_ffi.h +0 -256
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/chat.h +0 -145
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/common.h +0 -674
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-alloc.h +0 -76
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-backend-impl.h +0 -255
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-backend.h +0 -354
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-common.h +0 -1857
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-cpp.h +0 -39
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-cpu.h +0 -143
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-impl.h +0 -601
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-metal-impl.h +0 -622
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-metal.h +0 -66
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-opt.h +0 -237
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-quants.h +0 -100
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-threading.h +0 -14
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml.h +0 -2202
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/gguf.h +0 -202
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/json.hpp +0 -24766
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-adapter.h +0 -76
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-arch.h +0 -437
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-batch.h +0 -89
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-chat.h +0 -58
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-context.h +0 -276
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-cparams.h +0 -39
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-cpp.h +0 -30
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-grammar.h +0 -173
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-graph.h +0 -640
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-hparams.h +0 -190
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-impl.h +0 -61
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-io.h +0 -35
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-kv-cache.h +0 -515
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-memory.h +0 -32
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-mmap.h +0 -68
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model-loader.h +0 -169
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model-saver.h +0 -37
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model.h +0 -425
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-sampling.h +0 -32
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-vocab.h +0 -131
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama.h +0 -1376
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/log.h +0 -103
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/minja/chat-template.hpp +0 -542
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/minja/minja.hpp +0 -2974
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/sampling.h +0 -107
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/unicode-data.h +0 -20
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/unicode.h +0 -66
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/cactus +0 -0
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/ggml-llama.metallib +0 -0
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/cactus.h +0 -232
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/cactus_ffi.h +0 -256
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/chat.h +0 -145
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/common.h +0 -674
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-alloc.h +0 -76
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend-impl.h +0 -255
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend.h +0 -354
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-common.h +0 -1857
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpp.h +0 -39
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpu.h +0 -143
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-impl.h +0 -601
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal-impl.h +0 -622
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal.h +0 -66
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-opt.h +0 -237
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-quants.h +0 -100
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-threading.h +0 -14
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml.h +0 -2202
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/gguf.h +0 -202
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/json.hpp +0 -24766
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-adapter.h +0 -76
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-arch.h +0 -437
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-batch.h +0 -89
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-chat.h +0 -58
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-context.h +0 -276
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-cparams.h +0 -39
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-cpp.h +0 -30
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-grammar.h +0 -173
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-graph.h +0 -640
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-hparams.h +0 -190
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-impl.h +0 -61
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-io.h +0 -35
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-kv-cache.h +0 -515
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-memory.h +0 -32
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-mmap.h +0 -68
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-loader.h +0 -169
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-saver.h +0 -37
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model.h +0 -425
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-sampling.h +0 -32
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-vocab.h +0 -131
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama.h +0 -1376
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/log.h +0 -103
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/minja/chat-template.hpp +0 -542
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/minja/minja.hpp +0 -2974
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/sampling.h +0 -107
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/unicode-data.h +0 -20
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/unicode.h +0 -66
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/cactus +0 -0
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/ggml-llama-sim.metallib +0 -0
- package/lib/commonjs/NativeCactus.js +0 -9
- package/lib/commonjs/NativeCactus.js.map +0 -1
- package/lib/commonjs/agent.js +0 -73
- package/lib/commonjs/agent.js.map +0 -1
- package/lib/commonjs/chat.js +0 -73
- package/lib/commonjs/chat.js.map +0 -1
- package/lib/commonjs/index.js +0 -523
- package/lib/commonjs/index.js.map +0 -1
- package/lib/commonjs/lm.js +0 -272
- package/lib/commonjs/lm.js.map +0 -1
- package/lib/commonjs/package.json +0 -1
- package/lib/commonjs/projectId.js +0 -9
- package/lib/commonjs/projectId.js.map +0 -1
- package/lib/commonjs/remote.js +0 -100
- package/lib/commonjs/remote.js.map +0 -1
- package/lib/commonjs/telemetry.js +0 -102
- package/lib/commonjs/telemetry.js.map +0 -1
- package/lib/commonjs/tools.js +0 -72
- package/lib/commonjs/tools.js.map +0 -1
- package/lib/commonjs/tts.js +0 -141
- package/lib/commonjs/tts.js.map +0 -1
- package/lib/commonjs/vlm.js +0 -221
- package/lib/commonjs/vlm.js.map +0 -1
- package/lib/module/NativeCactus.js +0 -5
- package/lib/module/NativeCactus.js.map +0 -1
- package/lib/module/agent.js +0 -68
- package/lib/module/agent.js.map +0 -1
- package/lib/module/chat.js +0 -67
- package/lib/module/chat.js.map +0 -1
- package/lib/module/lm.js +0 -267
- package/lib/module/lm.js.map +0 -1
- package/lib/module/projectId.js +0 -5
- package/lib/module/projectId.js.map +0 -1
- package/lib/module/remote.js +0 -91
- package/lib/module/remote.js.map +0 -1
- package/lib/module/telemetry.js +0 -97
- package/lib/module/telemetry.js.map +0 -1
- package/lib/module/tools.js +0 -66
- package/lib/module/tools.js.map +0 -1
- package/lib/module/tts.js +0 -135
- package/lib/module/tts.js.map +0 -1
- package/lib/module/vlm.js +0 -216
- package/lib/module/vlm.js.map +0 -1
- package/lib/typescript/NativeCactus.d.ts +0 -252
- package/lib/typescript/NativeCactus.d.ts.map +0 -1
- package/lib/typescript/agent.d.ts +0 -31
- package/lib/typescript/agent.d.ts.map +0 -1
- package/lib/typescript/chat.d.ts +0 -23
- package/lib/typescript/chat.d.ts.map +0 -1
- package/lib/typescript/index.d.ts +0 -114
- package/lib/typescript/index.d.ts.map +0 -1
- package/lib/typescript/lm.d.ts +0 -36
- package/lib/typescript/lm.d.ts.map +0 -1
- package/lib/typescript/projectId.d.ts +0 -2
- package/lib/typescript/projectId.d.ts.map +0 -1
- package/lib/typescript/remote.d.ts +0 -8
- package/lib/typescript/remote.d.ts.map +0 -1
- package/lib/typescript/telemetry.d.ts +0 -25
- package/lib/typescript/telemetry.d.ts.map +0 -1
- package/lib/typescript/tools.d.ts +0 -36
- package/lib/typescript/tools.d.ts.map +0 -1
- package/lib/typescript/tts.d.ts +0 -54
- package/lib/typescript/tts.d.ts.map +0 -1
- package/lib/typescript/vlm.d.ts +0 -33
- package/lib/typescript/vlm.d.ts.map +0 -1
- package/scripts/postInstall.js +0 -33
- package/src/NativeCactus.ts +0 -317
- package/src/agent.ts +0 -112
- package/src/chat.ts +0 -91
- package/src/index.ts +0 -663
- package/src/lm.ts +0 -324
- package/src/projectId.ts +0 -1
- package/src/remote.ts +0 -113
- package/src/telemetry.ts +0 -137
- package/src/tools.ts +0 -94
- package/src/tts.ts +0 -236
- package/src/vlm.ts +0 -276
package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-adapter.h
DELETED
|
@@ -1,76 +0,0 @@
|
|
|
1
|
-
#pragma once
|
|
2
|
-
|
|
3
|
-
#include "llama.h"
|
|
4
|
-
|
|
5
|
-
#include "ggml-cpp.h"
|
|
6
|
-
|
|
7
|
-
#include <string>
|
|
8
|
-
#include <unordered_map>
|
|
9
|
-
#include <vector>
|
|
10
|
-
|
|
11
|
-
// TODO: pimpl
|
|
12
|
-
|
|
13
|
-
//
|
|
14
|
-
// llama_adapter_cvec
|
|
15
|
-
//
|
|
16
|
-
|
|
17
|
-
struct llama_adapter_cvec {
|
|
18
|
-
lm_ggml_tensor * tensor_for(int il) const;
|
|
19
|
-
|
|
20
|
-
lm_ggml_tensor * apply_to(lm_ggml_context * ctx, lm_ggml_tensor * cur, int il) const;
|
|
21
|
-
|
|
22
|
-
bool apply(
|
|
23
|
-
const llama_model & model,
|
|
24
|
-
const float * data,
|
|
25
|
-
size_t len,
|
|
26
|
-
int32_t n_embd,
|
|
27
|
-
int32_t il_start,
|
|
28
|
-
int32_t il_end);
|
|
29
|
-
|
|
30
|
-
private:
|
|
31
|
-
bool init(const llama_model & model);
|
|
32
|
-
|
|
33
|
-
int32_t layer_start = -1;
|
|
34
|
-
int32_t layer_end = -1;
|
|
35
|
-
|
|
36
|
-
std::vector<lm_ggml_context_ptr> ctxs;
|
|
37
|
-
std::vector<lm_ggml_backend_buffer_ptr> bufs;
|
|
38
|
-
|
|
39
|
-
std::vector<lm_ggml_tensor *> tensors; // per layer
|
|
40
|
-
};
|
|
41
|
-
|
|
42
|
-
//
|
|
43
|
-
// llama_adapter_lora
|
|
44
|
-
//
|
|
45
|
-
|
|
46
|
-
struct llama_adapter_lora_weight {
|
|
47
|
-
lm_ggml_tensor * a = nullptr;
|
|
48
|
-
lm_ggml_tensor * b = nullptr;
|
|
49
|
-
|
|
50
|
-
// get actual scale based on rank and alpha
|
|
51
|
-
float get_scale(float alpha, float adapter_scale) const {
|
|
52
|
-
const float rank = (float) b->ne[0];
|
|
53
|
-
const float scale = alpha ? adapter_scale * alpha / rank : adapter_scale;
|
|
54
|
-
return scale;
|
|
55
|
-
}
|
|
56
|
-
|
|
57
|
-
llama_adapter_lora_weight() = default;
|
|
58
|
-
llama_adapter_lora_weight(lm_ggml_tensor * a, lm_ggml_tensor * b) : a(a), b(b) {}
|
|
59
|
-
};
|
|
60
|
-
|
|
61
|
-
struct llama_adapter_lora {
|
|
62
|
-
// map tensor name to lora_a_b
|
|
63
|
-
std::unordered_map<std::string, llama_adapter_lora_weight> ab_map;
|
|
64
|
-
|
|
65
|
-
std::vector<lm_ggml_context_ptr> ctxs;
|
|
66
|
-
std::vector<lm_ggml_backend_buffer_ptr> bufs;
|
|
67
|
-
|
|
68
|
-
float alpha;
|
|
69
|
-
|
|
70
|
-
llama_adapter_lora() = default;
|
|
71
|
-
~llama_adapter_lora() = default;
|
|
72
|
-
|
|
73
|
-
llama_adapter_lora_weight * get_weight(lm_ggml_tensor * w);
|
|
74
|
-
};
|
|
75
|
-
|
|
76
|
-
using llama_adapter_loras = std::unordered_map<llama_adapter_lora *, float>;
|
package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-arch.h
DELETED
|
@@ -1,437 +0,0 @@
|
|
|
1
|
-
#pragma once
|
|
2
|
-
|
|
3
|
-
#include "ggml.h" // lm_ggml_op
|
|
4
|
-
|
|
5
|
-
#include <string>
|
|
6
|
-
|
|
7
|
-
//
|
|
8
|
-
// gguf constants (sync with gguf.py)
|
|
9
|
-
//
|
|
10
|
-
|
|
11
|
-
enum llm_arch {
|
|
12
|
-
LLM_ARCH_LLAMA,
|
|
13
|
-
LLM_ARCH_LLAMA4,
|
|
14
|
-
LLM_ARCH_DECI,
|
|
15
|
-
LLM_ARCH_FALCON,
|
|
16
|
-
LLM_ARCH_BAICHUAN,
|
|
17
|
-
LLM_ARCH_GROK,
|
|
18
|
-
LLM_ARCH_GPT2,
|
|
19
|
-
LLM_ARCH_GPTJ,
|
|
20
|
-
LLM_ARCH_GPTNEOX,
|
|
21
|
-
LLM_ARCH_MPT,
|
|
22
|
-
LLM_ARCH_STARCODER,
|
|
23
|
-
LLM_ARCH_REFACT,
|
|
24
|
-
LLM_ARCH_BERT,
|
|
25
|
-
LLM_ARCH_NOMIC_BERT,
|
|
26
|
-
LLM_ARCH_NOMIC_BERT_MOE,
|
|
27
|
-
LLM_ARCH_JINA_BERT_V2,
|
|
28
|
-
LLM_ARCH_BLOOM,
|
|
29
|
-
LLM_ARCH_STABLELM,
|
|
30
|
-
LLM_ARCH_QWEN,
|
|
31
|
-
LLM_ARCH_QWEN2,
|
|
32
|
-
LLM_ARCH_QWEN2MOE,
|
|
33
|
-
LLM_ARCH_QWEN2VL,
|
|
34
|
-
LLM_ARCH_QWEN3,
|
|
35
|
-
LLM_ARCH_QWEN3MOE,
|
|
36
|
-
LLM_ARCH_PHI2,
|
|
37
|
-
LLM_ARCH_PHI3,
|
|
38
|
-
LLM_ARCH_PHIMOE,
|
|
39
|
-
LLM_ARCH_PLAMO,
|
|
40
|
-
LLM_ARCH_CODESHELL,
|
|
41
|
-
LLM_ARCH_ORION,
|
|
42
|
-
LLM_ARCH_INTERNLM2,
|
|
43
|
-
LLM_ARCH_MINICPM,
|
|
44
|
-
LLM_ARCH_MINICPM3,
|
|
45
|
-
LLM_ARCH_GEMMA,
|
|
46
|
-
LLM_ARCH_GEMMA2,
|
|
47
|
-
LLM_ARCH_GEMMA3,
|
|
48
|
-
LLM_ARCH_STARCODER2,
|
|
49
|
-
LLM_ARCH_MAMBA,
|
|
50
|
-
LLM_ARCH_XVERSE,
|
|
51
|
-
LLM_ARCH_COMMAND_R,
|
|
52
|
-
LLM_ARCH_COHERE2,
|
|
53
|
-
LLM_ARCH_DBRX,
|
|
54
|
-
LLM_ARCH_OLMO,
|
|
55
|
-
LLM_ARCH_OLMO2,
|
|
56
|
-
LLM_ARCH_OLMOE,
|
|
57
|
-
LLM_ARCH_OPENELM,
|
|
58
|
-
LLM_ARCH_ARCTIC,
|
|
59
|
-
LLM_ARCH_DEEPSEEK,
|
|
60
|
-
LLM_ARCH_DEEPSEEK2,
|
|
61
|
-
LLM_ARCH_CHATGLM,
|
|
62
|
-
LLM_ARCH_GLM4,
|
|
63
|
-
LLM_ARCH_BITNET,
|
|
64
|
-
LLM_ARCH_T5,
|
|
65
|
-
LLM_ARCH_T5ENCODER,
|
|
66
|
-
LLM_ARCH_JAIS,
|
|
67
|
-
LLM_ARCH_NEMOTRON,
|
|
68
|
-
LLM_ARCH_EXAONE,
|
|
69
|
-
LLM_ARCH_RWKV6,
|
|
70
|
-
LLM_ARCH_RWKV6QWEN2,
|
|
71
|
-
LLM_ARCH_RWKV7,
|
|
72
|
-
LLM_ARCH_ARWKV7,
|
|
73
|
-
LLM_ARCH_GRANITE,
|
|
74
|
-
LLM_ARCH_GRANITE_MOE,
|
|
75
|
-
LLM_ARCH_CHAMELEON,
|
|
76
|
-
LLM_ARCH_WAVTOKENIZER_DEC,
|
|
77
|
-
LLM_ARCH_PLM,
|
|
78
|
-
LLM_ARCH_BAILINGMOE,
|
|
79
|
-
LLM_ARCH_UNKNOWN,
|
|
80
|
-
};
|
|
81
|
-
|
|
82
|
-
enum llm_kv {
|
|
83
|
-
LLM_KV_GENERAL_TYPE,
|
|
84
|
-
LLM_KV_GENERAL_ARCHITECTURE,
|
|
85
|
-
LLM_KV_GENERAL_QUANTIZATION_VERSION,
|
|
86
|
-
LLM_KV_GENERAL_ALIGNMENT,
|
|
87
|
-
LLM_KV_GENERAL_FILE_TYPE,
|
|
88
|
-
LLM_KV_GENERAL_NAME,
|
|
89
|
-
LLM_KV_GENERAL_AUTHOR,
|
|
90
|
-
LLM_KV_GENERAL_VERSION,
|
|
91
|
-
LLM_KV_GENERAL_URL,
|
|
92
|
-
LLM_KV_GENERAL_DESCRIPTION,
|
|
93
|
-
LLM_KV_GENERAL_LICENSE,
|
|
94
|
-
LLM_KV_GENERAL_SOURCE_URL,
|
|
95
|
-
LLM_KV_GENERAL_SOURCE_HF_REPO,
|
|
96
|
-
|
|
97
|
-
LLM_KV_VOCAB_SIZE,
|
|
98
|
-
LLM_KV_CONTEXT_LENGTH,
|
|
99
|
-
LLM_KV_EMBEDDING_LENGTH,
|
|
100
|
-
LLM_KV_FEATURES_LENGTH,
|
|
101
|
-
LLM_KV_BLOCK_COUNT,
|
|
102
|
-
LLM_KV_LEADING_DENSE_BLOCK_COUNT,
|
|
103
|
-
LLM_KV_FEED_FORWARD_LENGTH,
|
|
104
|
-
LLM_KV_EXPERT_FEED_FORWARD_LENGTH,
|
|
105
|
-
LLM_KV_EXPERT_SHARED_FEED_FORWARD_LENGTH,
|
|
106
|
-
LLM_KV_USE_PARALLEL_RESIDUAL,
|
|
107
|
-
LLM_KV_TENSOR_DATA_LAYOUT,
|
|
108
|
-
LLM_KV_EXPERT_COUNT,
|
|
109
|
-
LLM_KV_EXPERT_USED_COUNT,
|
|
110
|
-
LLM_KV_EXPERT_SHARED_COUNT,
|
|
111
|
-
LLM_KV_EXPERT_WEIGHTS_SCALE,
|
|
112
|
-
LLM_KV_EXPERT_WEIGHTS_NORM,
|
|
113
|
-
LLM_KV_EXPERT_GATING_FUNC,
|
|
114
|
-
LLM_KV_MOE_EVERY_N_LAYERS,
|
|
115
|
-
LLM_KV_POOLING_TYPE,
|
|
116
|
-
LLM_KV_LOGIT_SCALE,
|
|
117
|
-
LLM_KV_DECODER_START_TOKEN_ID,
|
|
118
|
-
LLM_KV_ATTN_LOGIT_SOFTCAPPING,
|
|
119
|
-
LLM_KV_FINAL_LOGIT_SOFTCAPPING,
|
|
120
|
-
LLM_KV_SWIN_NORM,
|
|
121
|
-
LLM_KV_RESCALE_EVERY_N_LAYERS,
|
|
122
|
-
LLM_KV_TIME_MIX_EXTRA_DIM,
|
|
123
|
-
LLM_KV_TIME_DECAY_EXTRA_DIM,
|
|
124
|
-
LLM_KV_RESIDUAL_SCALE,
|
|
125
|
-
LLM_KV_EMBEDDING_SCALE,
|
|
126
|
-
LLM_KV_TOKEN_SHIFT_COUNT,
|
|
127
|
-
LLM_KV_INTERLEAVE_MOE_LAYER_STEP,
|
|
128
|
-
|
|
129
|
-
LLM_KV_ATTENTION_HEAD_COUNT,
|
|
130
|
-
LLM_KV_ATTENTION_HEAD_COUNT_KV,
|
|
131
|
-
LLM_KV_ATTENTION_MAX_ALIBI_BIAS,
|
|
132
|
-
LLM_KV_ATTENTION_CLAMP_KQV,
|
|
133
|
-
LLM_KV_ATTENTION_KEY_LENGTH,
|
|
134
|
-
LLM_KV_ATTENTION_VALUE_LENGTH,
|
|
135
|
-
LLM_KV_ATTENTION_LAYERNORM_EPS,
|
|
136
|
-
LLM_KV_ATTENTION_LAYERNORM_RMS_EPS,
|
|
137
|
-
LLM_KV_ATTENTION_GROUPNORM_EPS,
|
|
138
|
-
LLM_KV_ATTENTION_GROUPNORM_GROUPS,
|
|
139
|
-
LLM_KV_ATTENTION_CAUSAL,
|
|
140
|
-
LLM_KV_ATTENTION_Q_LORA_RANK,
|
|
141
|
-
LLM_KV_ATTENTION_KV_LORA_RANK,
|
|
142
|
-
LLM_KV_ATTENTION_DECAY_LORA_RANK,
|
|
143
|
-
LLM_KV_ATTENTION_ICLR_LORA_RANK,
|
|
144
|
-
LLM_KV_ATTENTION_VALUE_RESIDUAL_MIX_LORA_RANK,
|
|
145
|
-
LLM_KV_ATTENTION_GATE_LORA_RANK,
|
|
146
|
-
LLM_KV_ATTENTION_RELATIVE_BUCKETS_COUNT,
|
|
147
|
-
LLM_KV_ATTENTION_SLIDING_WINDOW,
|
|
148
|
-
LLM_KV_ATTENTION_SCALE,
|
|
149
|
-
LLM_KV_ATTENTION_KEY_LENGTH_MLA,
|
|
150
|
-
LLM_KV_ATTENTION_VALUE_LENGTH_MLA,
|
|
151
|
-
|
|
152
|
-
LLM_KV_ROPE_DIMENSION_COUNT,
|
|
153
|
-
LLM_KV_ROPE_DIMENSION_SECTIONS,
|
|
154
|
-
LLM_KV_ROPE_FREQ_BASE,
|
|
155
|
-
LLM_KV_ROPE_SCALE_LINEAR,
|
|
156
|
-
LLM_KV_ROPE_SCALING_TYPE,
|
|
157
|
-
LLM_KV_ROPE_SCALING_FACTOR,
|
|
158
|
-
LLM_KV_ROPE_SCALING_ATTN_FACTOR,
|
|
159
|
-
LLM_KV_ROPE_SCALING_ORIG_CTX_LEN,
|
|
160
|
-
LLM_KV_ROPE_SCALING_FINETUNED,
|
|
161
|
-
LLM_KV_ROPE_SCALING_YARN_LOG_MUL,
|
|
162
|
-
|
|
163
|
-
LLM_KV_SPLIT_NO,
|
|
164
|
-
LLM_KV_SPLIT_COUNT,
|
|
165
|
-
LLM_KV_SPLIT_TENSORS_COUNT,
|
|
166
|
-
|
|
167
|
-
LLM_KV_SSM_INNER_SIZE,
|
|
168
|
-
LLM_KV_SSM_CONV_KERNEL,
|
|
169
|
-
LLM_KV_SSM_STATE_SIZE,
|
|
170
|
-
LLM_KV_SSM_TIME_STEP_RANK,
|
|
171
|
-
LLM_KV_SSM_DT_B_C_RMS,
|
|
172
|
-
|
|
173
|
-
LLM_KV_WKV_HEAD_SIZE,
|
|
174
|
-
|
|
175
|
-
LLM_KV_TOKENIZER_MODEL,
|
|
176
|
-
LLM_KV_TOKENIZER_PRE,
|
|
177
|
-
LLM_KV_TOKENIZER_LIST,
|
|
178
|
-
LLM_KV_TOKENIZER_TOKEN_TYPE,
|
|
179
|
-
LLM_KV_TOKENIZER_TOKEN_TYPE_COUNT,
|
|
180
|
-
LLM_KV_TOKENIZER_SCORES,
|
|
181
|
-
LLM_KV_TOKENIZER_MERGES,
|
|
182
|
-
LLM_KV_TOKENIZER_BOS_ID,
|
|
183
|
-
LLM_KV_TOKENIZER_EOS_ID,
|
|
184
|
-
LLM_KV_TOKENIZER_EOT_ID,
|
|
185
|
-
LLM_KV_TOKENIZER_EOM_ID,
|
|
186
|
-
LLM_KV_TOKENIZER_UNK_ID,
|
|
187
|
-
LLM_KV_TOKENIZER_SEP_ID,
|
|
188
|
-
LLM_KV_TOKENIZER_PAD_ID,
|
|
189
|
-
LLM_KV_TOKENIZER_CLS_ID,
|
|
190
|
-
LLM_KV_TOKENIZER_MASK_ID,
|
|
191
|
-
LLM_KV_TOKENIZER_ADD_BOS,
|
|
192
|
-
LLM_KV_TOKENIZER_ADD_EOS,
|
|
193
|
-
LLM_KV_TOKENIZER_ADD_PREFIX,
|
|
194
|
-
LLM_KV_TOKENIZER_REMOVE_EXTRA_WS,
|
|
195
|
-
LLM_KV_TOKENIZER_PRECOMPILED_CHARSMAP,
|
|
196
|
-
LLM_KV_TOKENIZER_HF_JSON,
|
|
197
|
-
LLM_KV_TOKENIZER_RWKV,
|
|
198
|
-
LLM_KV_TOKENIZER_CHAT_TEMPLATE,
|
|
199
|
-
LLM_KV_TOKENIZER_CHAT_TEMPLATE_N,
|
|
200
|
-
LLM_KV_TOKENIZER_FIM_PRE_ID,
|
|
201
|
-
LLM_KV_TOKENIZER_FIM_SUF_ID,
|
|
202
|
-
LLM_KV_TOKENIZER_FIM_MID_ID,
|
|
203
|
-
LLM_KV_TOKENIZER_FIM_PAD_ID,
|
|
204
|
-
LLM_KV_TOKENIZER_FIM_REP_ID,
|
|
205
|
-
LLM_KV_TOKENIZER_FIM_SEP_ID,
|
|
206
|
-
|
|
207
|
-
LLM_KV_ADAPTER_TYPE,
|
|
208
|
-
LLM_KV_ADAPTER_LORA_ALPHA,
|
|
209
|
-
|
|
210
|
-
LLM_KV_POSNET_EMBEDDING_LENGTH,
|
|
211
|
-
LLM_KV_POSNET_BLOCK_COUNT,
|
|
212
|
-
|
|
213
|
-
LLM_KV_CONVNEXT_EMBEDDING_LENGTH,
|
|
214
|
-
LLM_KV_CONVNEXT_BLOCK_COUNT,
|
|
215
|
-
|
|
216
|
-
// deprecated:
|
|
217
|
-
LLM_KV_TOKENIZER_PREFIX_ID,
|
|
218
|
-
LLM_KV_TOKENIZER_SUFFIX_ID,
|
|
219
|
-
LLM_KV_TOKENIZER_MIDDLE_ID,
|
|
220
|
-
};
|
|
221
|
-
|
|
222
|
-
enum llm_tensor {
|
|
223
|
-
LLM_TENSOR_TOKEN_EMBD,
|
|
224
|
-
LLM_TENSOR_TOKEN_EMBD_NORM,
|
|
225
|
-
LLM_TENSOR_TOKEN_TYPES,
|
|
226
|
-
LLM_TENSOR_POS_EMBD,
|
|
227
|
-
LLM_TENSOR_OUTPUT,
|
|
228
|
-
LLM_TENSOR_OUTPUT_NORM,
|
|
229
|
-
LLM_TENSOR_ROPE_FREQS,
|
|
230
|
-
LLM_TENSOR_ROPE_FACTORS_LONG,
|
|
231
|
-
LLM_TENSOR_ROPE_FACTORS_SHORT,
|
|
232
|
-
LLM_TENSOR_ATTN_Q,
|
|
233
|
-
LLM_TENSOR_ATTN_K,
|
|
234
|
-
LLM_TENSOR_ATTN_V,
|
|
235
|
-
LLM_TENSOR_ATTN_QKV,
|
|
236
|
-
LLM_TENSOR_ATTN_OUT,
|
|
237
|
-
LLM_TENSOR_ATTN_NORM,
|
|
238
|
-
LLM_TENSOR_ATTN_NORM_2,
|
|
239
|
-
LLM_TENSOR_ATTN_OUT_NORM,
|
|
240
|
-
LLM_TENSOR_ATTN_POST_NORM,
|
|
241
|
-
LLM_TENSOR_ATTN_ROT_EMBD,
|
|
242
|
-
LLM_TENSOR_FFN_GATE_INP,
|
|
243
|
-
LLM_TENSOR_FFN_GATE_INP_SHEXP,
|
|
244
|
-
LLM_TENSOR_FFN_NORM,
|
|
245
|
-
LLM_TENSOR_FFN_POST_NORM,
|
|
246
|
-
LLM_TENSOR_FFN_GATE,
|
|
247
|
-
LLM_TENSOR_FFN_DOWN,
|
|
248
|
-
LLM_TENSOR_FFN_UP,
|
|
249
|
-
LLM_TENSOR_FFN_ACT,
|
|
250
|
-
LLM_TENSOR_FFN_DOWN_EXP, // split experts for backward compatibility
|
|
251
|
-
LLM_TENSOR_FFN_GATE_EXP,
|
|
252
|
-
LLM_TENSOR_FFN_UP_EXP,
|
|
253
|
-
LLM_TENSOR_FFN_NORM_EXPS,
|
|
254
|
-
LLM_TENSOR_FFN_DOWN_EXPS, // merged experts
|
|
255
|
-
LLM_TENSOR_FFN_GATE_EXPS,
|
|
256
|
-
LLM_TENSOR_FFN_UP_EXPS,
|
|
257
|
-
LLM_TENSOR_FFN_DOWN_SHEXP,
|
|
258
|
-
LLM_TENSOR_FFN_GATE_SHEXP,
|
|
259
|
-
LLM_TENSOR_FFN_UP_SHEXP,
|
|
260
|
-
LLM_TENSOR_FFN_EXP_PROBS_B,
|
|
261
|
-
LLM_TENSOR_ATTN_Q_NORM,
|
|
262
|
-
LLM_TENSOR_ATTN_K_NORM,
|
|
263
|
-
LLM_TENSOR_LAYER_OUT_NORM,
|
|
264
|
-
LLM_TENSOR_POST_ATTN_NORM,
|
|
265
|
-
LLM_TENSOR_POST_MLP_NORM,
|
|
266
|
-
LLM_TENSOR_SSM_IN,
|
|
267
|
-
LLM_TENSOR_SSM_CONV1D,
|
|
268
|
-
LLM_TENSOR_SSM_X,
|
|
269
|
-
LLM_TENSOR_SSM_DT,
|
|
270
|
-
LLM_TENSOR_SSM_A,
|
|
271
|
-
LLM_TENSOR_SSM_D,
|
|
272
|
-
LLM_TENSOR_SSM_OUT,
|
|
273
|
-
LLM_TENSOR_TIME_MIX_W0,
|
|
274
|
-
LLM_TENSOR_TIME_MIX_W1,
|
|
275
|
-
LLM_TENSOR_TIME_MIX_W2,
|
|
276
|
-
LLM_TENSOR_TIME_MIX_A0,
|
|
277
|
-
LLM_TENSOR_TIME_MIX_A1,
|
|
278
|
-
LLM_TENSOR_TIME_MIX_A2,
|
|
279
|
-
LLM_TENSOR_TIME_MIX_V0,
|
|
280
|
-
LLM_TENSOR_TIME_MIX_V1,
|
|
281
|
-
LLM_TENSOR_TIME_MIX_V2,
|
|
282
|
-
LLM_TENSOR_TIME_MIX_G1,
|
|
283
|
-
LLM_TENSOR_TIME_MIX_G2,
|
|
284
|
-
LLM_TENSOR_TIME_MIX_K_K,
|
|
285
|
-
LLM_TENSOR_TIME_MIX_K_A,
|
|
286
|
-
LLM_TENSOR_TIME_MIX_R_K,
|
|
287
|
-
LLM_TENSOR_TIME_MIX_LERP_X,
|
|
288
|
-
LLM_TENSOR_TIME_MIX_LERP_W,
|
|
289
|
-
LLM_TENSOR_TIME_MIX_LERP_K,
|
|
290
|
-
LLM_TENSOR_TIME_MIX_LERP_V,
|
|
291
|
-
LLM_TENSOR_TIME_MIX_LERP_R,
|
|
292
|
-
LLM_TENSOR_TIME_MIX_LERP_G,
|
|
293
|
-
LLM_TENSOR_TIME_MIX_LERP_FUSED,
|
|
294
|
-
LLM_TENSOR_TIME_MIX_FIRST,
|
|
295
|
-
LLM_TENSOR_TIME_MIX_DECAY,
|
|
296
|
-
LLM_TENSOR_TIME_MIX_DECAY_W1,
|
|
297
|
-
LLM_TENSOR_TIME_MIX_DECAY_W2,
|
|
298
|
-
LLM_TENSOR_TIME_MIX_KEY,
|
|
299
|
-
LLM_TENSOR_TIME_MIX_VALUE,
|
|
300
|
-
LLM_TENSOR_TIME_MIX_RECEPTANCE,
|
|
301
|
-
LLM_TENSOR_TIME_MIX_GATE,
|
|
302
|
-
LLM_TENSOR_TIME_MIX_LN,
|
|
303
|
-
LLM_TENSOR_TIME_MIX_OUTPUT,
|
|
304
|
-
LLM_TENSOR_CHANNEL_MIX_LERP_K,
|
|
305
|
-
LLM_TENSOR_CHANNEL_MIX_LERP_R,
|
|
306
|
-
LLM_TENSOR_CHANNEL_MIX_KEY,
|
|
307
|
-
LLM_TENSOR_CHANNEL_MIX_RECEPTANCE,
|
|
308
|
-
LLM_TENSOR_CHANNEL_MIX_VALUE,
|
|
309
|
-
LLM_TENSOR_ATTN_Q_A,
|
|
310
|
-
LLM_TENSOR_ATTN_Q_B,
|
|
311
|
-
LLM_TENSOR_ATTN_KV_A_MQA,
|
|
312
|
-
LLM_TENSOR_ATTN_KV_B,
|
|
313
|
-
LLM_TENSOR_ATTN_K_B,
|
|
314
|
-
LLM_TENSOR_ATTN_V_B,
|
|
315
|
-
LLM_TENSOR_ATTN_Q_A_NORM,
|
|
316
|
-
LLM_TENSOR_ATTN_KV_A_NORM,
|
|
317
|
-
LLM_TENSOR_ATTN_SUB_NORM,
|
|
318
|
-
LLM_TENSOR_FFN_SUB_NORM,
|
|
319
|
-
LLM_TENSOR_DEC_ATTN_NORM,
|
|
320
|
-
LLM_TENSOR_DEC_ATTN_Q,
|
|
321
|
-
LLM_TENSOR_DEC_ATTN_K,
|
|
322
|
-
LLM_TENSOR_DEC_ATTN_V,
|
|
323
|
-
LLM_TENSOR_DEC_ATTN_OUT,
|
|
324
|
-
LLM_TENSOR_DEC_ATTN_REL_B,
|
|
325
|
-
LLM_TENSOR_DEC_CROSS_ATTN_NORM,
|
|
326
|
-
LLM_TENSOR_DEC_CROSS_ATTN_Q,
|
|
327
|
-
LLM_TENSOR_DEC_CROSS_ATTN_K,
|
|
328
|
-
LLM_TENSOR_DEC_CROSS_ATTN_V,
|
|
329
|
-
LLM_TENSOR_DEC_CROSS_ATTN_OUT,
|
|
330
|
-
LLM_TENSOR_DEC_CROSS_ATTN_REL_B,
|
|
331
|
-
LLM_TENSOR_DEC_FFN_NORM,
|
|
332
|
-
LLM_TENSOR_DEC_FFN_GATE,
|
|
333
|
-
LLM_TENSOR_DEC_FFN_DOWN,
|
|
334
|
-
LLM_TENSOR_DEC_FFN_UP,
|
|
335
|
-
LLM_TENSOR_DEC_OUTPUT_NORM,
|
|
336
|
-
LLM_TENSOR_ENC_ATTN_NORM,
|
|
337
|
-
LLM_TENSOR_ENC_ATTN_Q,
|
|
338
|
-
LLM_TENSOR_ENC_ATTN_K,
|
|
339
|
-
LLM_TENSOR_ENC_ATTN_V,
|
|
340
|
-
LLM_TENSOR_ENC_ATTN_OUT,
|
|
341
|
-
LLM_TENSOR_ENC_ATTN_REL_B,
|
|
342
|
-
LLM_TENSOR_ENC_FFN_NORM,
|
|
343
|
-
LLM_TENSOR_ENC_FFN_GATE,
|
|
344
|
-
LLM_TENSOR_ENC_FFN_DOWN,
|
|
345
|
-
LLM_TENSOR_ENC_FFN_UP,
|
|
346
|
-
LLM_TENSOR_ENC_OUTPUT_NORM,
|
|
347
|
-
LLM_TENSOR_CLS,
|
|
348
|
-
LLM_TENSOR_CLS_OUT,
|
|
349
|
-
LLM_TENSOR_CONV1D,
|
|
350
|
-
LLM_TENSOR_CONVNEXT_DW,
|
|
351
|
-
LLM_TENSOR_CONVNEXT_NORM,
|
|
352
|
-
LLM_TENSOR_CONVNEXT_PW1,
|
|
353
|
-
LLM_TENSOR_CONVNEXT_PW2,
|
|
354
|
-
LLM_TENSOR_CONVNEXT_GAMMA,
|
|
355
|
-
LLM_TENSOR_POS_NET_CONV1,
|
|
356
|
-
LLM_TENSOR_POS_NET_CONV2,
|
|
357
|
-
LLM_TENSOR_POS_NET_NORM,
|
|
358
|
-
LLM_TENSOR_POS_NET_NORM1,
|
|
359
|
-
LLM_TENSOR_POS_NET_NORM2,
|
|
360
|
-
LLM_TENSOR_POS_NET_ATTN_NORM,
|
|
361
|
-
LLM_TENSOR_POS_NET_ATTN_Q,
|
|
362
|
-
LLM_TENSOR_POS_NET_ATTN_K,
|
|
363
|
-
LLM_TENSOR_POS_NET_ATTN_V,
|
|
364
|
-
LLM_TENSOR_POS_NET_ATTN_OUT,
|
|
365
|
-
};
|
|
366
|
-
|
|
367
|
-
enum llm_tensor_layer {
|
|
368
|
-
LLM_TENSOR_LAYER_INPUT,
|
|
369
|
-
LLM_TENSOR_LAYER_REPEATING,
|
|
370
|
-
LLM_TENSOR_LAYER_OUTPUT,
|
|
371
|
-
};
|
|
372
|
-
|
|
373
|
-
struct LLM_KV {
|
|
374
|
-
LLM_KV(llm_arch arch, const char * suffix = nullptr);
|
|
375
|
-
|
|
376
|
-
llm_arch arch;
|
|
377
|
-
const char * suffix;
|
|
378
|
-
|
|
379
|
-
std::string operator()(llm_kv kv) const;
|
|
380
|
-
};
|
|
381
|
-
|
|
382
|
-
// helper to handle gguf constants
|
|
383
|
-
// usage:
|
|
384
|
-
//
|
|
385
|
-
// const auto tn = LLM_TN(LLM_ARCH_LLAMA);
|
|
386
|
-
//
|
|
387
|
-
// std::string name = tn(LLM_TENSOR_OUTPUT); -> "output"
|
|
388
|
-
// std::string name = tn(LLM_TENSOR_TOKEN_EMBD, "bias"); -> "token_embd.bias"
|
|
389
|
-
// std::string name = tn(LLM_TENSOR_ATTN_NORM, "weight", 3); -> "blk.3.attn_norm.weight"
|
|
390
|
-
//
|
|
391
|
-
struct LLM_TN_IMPL {
|
|
392
|
-
const llm_arch arch;
|
|
393
|
-
const llm_tensor tensor;
|
|
394
|
-
const char * const suffix;
|
|
395
|
-
const int bid;
|
|
396
|
-
const int xid;
|
|
397
|
-
|
|
398
|
-
std::string str() const;
|
|
399
|
-
|
|
400
|
-
operator std::string() const {
|
|
401
|
-
return str();
|
|
402
|
-
}
|
|
403
|
-
|
|
404
|
-
friend bool operator==(const std::string & str, const LLM_TN_IMPL & tn) {
|
|
405
|
-
return str == tn.str();
|
|
406
|
-
}
|
|
407
|
-
|
|
408
|
-
friend bool operator!=(const std::string & str, const LLM_TN_IMPL & tn) {
|
|
409
|
-
return str != tn.str();
|
|
410
|
-
}
|
|
411
|
-
};
|
|
412
|
-
|
|
413
|
-
struct LLM_TN {
|
|
414
|
-
LLM_TN(llm_arch arch) : arch(arch) {}
|
|
415
|
-
|
|
416
|
-
llm_arch arch;
|
|
417
|
-
|
|
418
|
-
LLM_TN_IMPL operator()(llm_tensor tensor, const char * suffix, int bid = -1, int xid = -1) const {
|
|
419
|
-
return { arch, tensor, suffix, bid, xid };
|
|
420
|
-
}
|
|
421
|
-
|
|
422
|
-
LLM_TN_IMPL operator()(llm_tensor tensor, int bid = -1, int xid = -1) const {
|
|
423
|
-
return { arch, tensor, nullptr, bid, xid };
|
|
424
|
-
}
|
|
425
|
-
};
|
|
426
|
-
|
|
427
|
-
|
|
428
|
-
struct llm_tensor_info {
|
|
429
|
-
llm_tensor_layer layer;
|
|
430
|
-
lm_ggml_op op;
|
|
431
|
-
};
|
|
432
|
-
|
|
433
|
-
const char * llm_arch_name(llm_arch arch);
|
|
434
|
-
|
|
435
|
-
llm_arch llm_arch_from_string(const std::string & name);
|
|
436
|
-
|
|
437
|
-
const llm_tensor_info & llm_tensor_info_for(llm_tensor tensor);
|
package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-batch.h
DELETED
|
@@ -1,89 +0,0 @@
|
|
|
1
|
-
#pragma once
|
|
2
|
-
|
|
3
|
-
#include "llama.h"
|
|
4
|
-
|
|
5
|
-
#include <array>
|
|
6
|
-
#include <vector>
|
|
7
|
-
|
|
8
|
-
// very similar to llama_batch,
|
|
9
|
-
// but has more metadata about sequences
|
|
10
|
-
struct llama_ubatch {
|
|
11
|
-
bool equal_seqs;
|
|
12
|
-
// TODO: whole_seqs for embeddings?
|
|
13
|
-
|
|
14
|
-
uint32_t n_tokens; // total tokens (n_seq_tokens * n_seqs)
|
|
15
|
-
uint32_t n_seq_tokens; // tokens per sequence
|
|
16
|
-
uint32_t n_seqs;
|
|
17
|
-
|
|
18
|
-
llama_token * token; // [n_tokens]
|
|
19
|
-
float * embd; // [n_embd, n_tokens]
|
|
20
|
-
llama_pos * pos; // [n_tokens]
|
|
21
|
-
int32_t * n_seq_id; // [n_seqs]
|
|
22
|
-
llama_seq_id ** seq_id; // [n_seqs]
|
|
23
|
-
int8_t * output; // [n_tokens]
|
|
24
|
-
};
|
|
25
|
-
|
|
26
|
-
struct llama_sbatch_seq {
|
|
27
|
-
int32_t n_seq_id;
|
|
28
|
-
|
|
29
|
-
llama_seq_id * seq_id;
|
|
30
|
-
|
|
31
|
-
size_t offset;
|
|
32
|
-
size_t length;
|
|
33
|
-
};
|
|
34
|
-
|
|
35
|
-
// sequence-length-aware batch splitting
|
|
36
|
-
struct llama_sbatch {
|
|
37
|
-
// tokens left in this batch
|
|
38
|
-
size_t n_tokens;
|
|
39
|
-
|
|
40
|
-
size_t n_embd;
|
|
41
|
-
|
|
42
|
-
bool logits_all; // TODO: remove once lctx.logits_all is removed too
|
|
43
|
-
|
|
44
|
-
// sorted indices into the batch
|
|
45
|
-
std::vector<int64_t> ids;
|
|
46
|
-
// batch indices of the output
|
|
47
|
-
std::vector<int64_t> out_ids;
|
|
48
|
-
std::vector<llama_sbatch_seq> seq;
|
|
49
|
-
|
|
50
|
-
const llama_batch * batch = nullptr;
|
|
51
|
-
|
|
52
|
-
// buffers for the ubatch
|
|
53
|
-
std::vector<llama_token> ubatch_token;
|
|
54
|
-
std::vector<float> ubatch_embd;
|
|
55
|
-
std::vector<llama_pos> ubatch_pos;
|
|
56
|
-
std::vector<int32_t> ubatch_n_seq_id;
|
|
57
|
-
std::vector<llama_seq_id *> ubatch_seq_id;
|
|
58
|
-
std::vector<int8_t> ubatch_output;
|
|
59
|
-
|
|
60
|
-
llama_ubatch reserve_ubatch(size_t n_ubatch, bool has_embd = false);
|
|
61
|
-
|
|
62
|
-
void add_seq_to_ubatch(llama_ubatch & ubatch, llama_sbatch_seq & seq, size_t length);
|
|
63
|
-
|
|
64
|
-
// simple split, unknown number of sequences of unequal lengths
|
|
65
|
-
llama_ubatch split_simple(size_t n_ubatch);
|
|
66
|
-
|
|
67
|
-
// make batches of equal-length sequences
|
|
68
|
-
llama_ubatch split_equal(size_t n_ubatch);
|
|
69
|
-
|
|
70
|
-
// sequence-wise split
|
|
71
|
-
llama_ubatch split_seq(size_t n_ubatch);
|
|
72
|
-
|
|
73
|
-
llama_sbatch() = default;
|
|
74
|
-
llama_sbatch(const llama_batch & batch, size_t n_embd, bool simple_split = false, bool logits_all = false);
|
|
75
|
-
};
|
|
76
|
-
|
|
77
|
-
// temporary allocate memory for the input batch if needed
|
|
78
|
-
struct llama_batch_allocr {
|
|
79
|
-
struct llama_batch batch;
|
|
80
|
-
|
|
81
|
-
std::array<llama_seq_id, 1> seq_id_0 = { 0 }; // default sequence id
|
|
82
|
-
std::vector<llama_pos> pos;
|
|
83
|
-
std::vector<int32_t> n_seq_id;
|
|
84
|
-
std::vector<llama_seq_id *> seq_id;
|
|
85
|
-
std::vector<int8_t> logits;
|
|
86
|
-
|
|
87
|
-
// optionally fulfill the batch returned by llama_batch_get_one
|
|
88
|
-
llama_batch_allocr(struct llama_batch in_batch, llama_pos p0);
|
|
89
|
-
};
|
package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-chat.h
DELETED
|
@@ -1,58 +0,0 @@
|
|
|
1
|
-
#pragma once
|
|
2
|
-
|
|
3
|
-
#include <string>
|
|
4
|
-
#include <vector>
|
|
5
|
-
#include <cstdint>
|
|
6
|
-
|
|
7
|
-
enum llm_chat_template {
|
|
8
|
-
LLM_CHAT_TEMPLATE_CHATML,
|
|
9
|
-
LLM_CHAT_TEMPLATE_LLAMA_2,
|
|
10
|
-
LLM_CHAT_TEMPLATE_LLAMA_2_SYS,
|
|
11
|
-
LLM_CHAT_TEMPLATE_LLAMA_2_SYS_BOS,
|
|
12
|
-
LLM_CHAT_TEMPLATE_LLAMA_2_SYS_STRIP,
|
|
13
|
-
LLM_CHAT_TEMPLATE_MISTRAL_V1,
|
|
14
|
-
LLM_CHAT_TEMPLATE_MISTRAL_V3,
|
|
15
|
-
LLM_CHAT_TEMPLATE_MISTRAL_V3_TEKKEN,
|
|
16
|
-
LLM_CHAT_TEMPLATE_MISTRAL_V7,
|
|
17
|
-
LLM_CHAT_TEMPLATE_MISTRAL_V7_TEKKEN,
|
|
18
|
-
LLM_CHAT_TEMPLATE_PHI_3,
|
|
19
|
-
LLM_CHAT_TEMPLATE_PHI_4,
|
|
20
|
-
LLM_CHAT_TEMPLATE_FALCON_3,
|
|
21
|
-
LLM_CHAT_TEMPLATE_ZEPHYR,
|
|
22
|
-
LLM_CHAT_TEMPLATE_MONARCH,
|
|
23
|
-
LLM_CHAT_TEMPLATE_GEMMA,
|
|
24
|
-
LLM_CHAT_TEMPLATE_ORION,
|
|
25
|
-
LLM_CHAT_TEMPLATE_OPENCHAT,
|
|
26
|
-
LLM_CHAT_TEMPLATE_VICUNA,
|
|
27
|
-
LLM_CHAT_TEMPLATE_VICUNA_ORCA,
|
|
28
|
-
LLM_CHAT_TEMPLATE_DEEPSEEK,
|
|
29
|
-
LLM_CHAT_TEMPLATE_DEEPSEEK_2,
|
|
30
|
-
LLM_CHAT_TEMPLATE_DEEPSEEK_3,
|
|
31
|
-
LLM_CHAT_TEMPLATE_COMMAND_R,
|
|
32
|
-
LLM_CHAT_TEMPLATE_LLAMA_3,
|
|
33
|
-
LLM_CHAT_TEMPLATE_CHATGLM_3,
|
|
34
|
-
LLM_CHAT_TEMPLATE_CHATGLM_4,
|
|
35
|
-
LLM_CHAT_TEMPLATE_GLMEDGE,
|
|
36
|
-
LLM_CHAT_TEMPLATE_MINICPM,
|
|
37
|
-
LLM_CHAT_TEMPLATE_EXAONE_3,
|
|
38
|
-
LLM_CHAT_TEMPLATE_RWKV_WORLD,
|
|
39
|
-
LLM_CHAT_TEMPLATE_GRANITE,
|
|
40
|
-
LLM_CHAT_TEMPLATE_GIGACHAT,
|
|
41
|
-
LLM_CHAT_TEMPLATE_MEGREZ,
|
|
42
|
-
LLM_CHAT_TEMPLATE_YANDEX,
|
|
43
|
-
LLM_CHAT_TEMPLATE_BAILING,
|
|
44
|
-
LLM_CHAT_TEMPLATE_LLAMA4,
|
|
45
|
-
LLM_CHAT_TEMPLATE_SMOLVLM,
|
|
46
|
-
LLM_CHAT_TEMPLATE_UNKNOWN,
|
|
47
|
-
};
|
|
48
|
-
|
|
49
|
-
struct llama_chat_message;
|
|
50
|
-
|
|
51
|
-
llm_chat_template llm_chat_template_from_str(const std::string & name);
|
|
52
|
-
|
|
53
|
-
llm_chat_template llm_chat_detect_template(const std::string & tmpl);
|
|
54
|
-
|
|
55
|
-
int32_t llm_chat_apply_template(
|
|
56
|
-
llm_chat_template tmpl,
|
|
57
|
-
const std::vector<const llama_chat_message *> & chat,
|
|
58
|
-
std::string & dest, bool add_ass);
|