cactus-react-native 0.2.10 → 1.0.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/Cactus.podspec +34 -0
- package/LICENSE +38 -0
- package/README.md +283 -722
- package/android/CMakeLists.txt +40 -0
- package/android/build.gradle +68 -44
- package/android/gradle.properties +5 -5
- package/android/src/main/AndroidManifest.xml +1 -3
- package/android/src/main/cpp/cpp-adapter.cpp +6 -0
- package/android/src/main/java/com/margelo/nitro/cactus/CactusPackage.kt +22 -0
- package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusCrypto.kt +38 -0
- package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusDeviceInfo.kt +24 -0
- package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusFileSystem.kt +227 -0
- package/android/src/main/jniLibs/arm64-v8a/{libcactus.so → libcactus.a} +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_util.so +0 -0
- package/cpp/HybridCactus.cpp +123 -0
- package/cpp/HybridCactus.hpp +35 -0
- package/cpp/HybridCactusUtil.cpp +45 -0
- package/cpp/HybridCactusUtil.hpp +26 -0
- package/cpp/cactus_ffi.h +55 -0
- package/cpp/cactus_util.h +25 -0
- package/ios/HybridCactusCrypto.swift +37 -0
- package/ios/HybridCactusDeviceInfo.swift +32 -0
- package/ios/HybridCactusFileSystem.swift +234 -0
- package/ios/cactus.xcframework/{info.plist → Info.plist} +2 -37
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus.h +8 -229
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus_ffi.h +28 -229
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/engine.h +347 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ffi_utils.h +286 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/graph.h +319 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/kernel.h +254 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/kernel_utils.h +343 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/cactus +0 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus.h +11 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus_ffi.h +55 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/engine.h +347 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/ffi_utils.h +286 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/graph.h +319 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/kernel.h +254 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/kernel_utils.h +343 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/{tvos-arm64_x86_64-simulator → ios-arm64-simulator}/cactus.framework/_CodeSignature/CodeResources +1 -1
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/cactus +0 -0
- package/ios/cactus_util.xcframework/Info.plist +39 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/cactus_util.h +25 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/ios_utils.h +10 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/logging.h +25 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Info.plist +0 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/cactus_util +0 -0
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/cactus_util.h +25 -0
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/ios_utils.h +10 -0
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/logging.h +25 -0
- package/ios/{cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework → cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework}/Info.plist +0 -0
- package/ios/{cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework → cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework}/_CodeSignature/CodeResources +36 -2
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/cactus_util +0 -0
- package/lib/module/api/Database.js +60 -0
- package/lib/module/api/Database.js.map +1 -0
- package/lib/module/classes/CactusLM.js +149 -0
- package/lib/module/classes/CactusLM.js.map +1 -0
- package/lib/module/config/CactusConfig.js +6 -0
- package/lib/module/config/CactusConfig.js.map +1 -0
- package/lib/module/constants/packageVersion.js +4 -0
- package/lib/module/constants/packageVersion.js.map +1 -0
- package/lib/module/hooks/useCactusLM.js +233 -0
- package/lib/module/hooks/useCactusLM.js.map +1 -0
- package/lib/module/index.js +9 -409
- package/lib/module/index.js.map +1 -1
- package/lib/module/native/Cactus.js +50 -0
- package/lib/module/native/Cactus.js.map +1 -0
- package/lib/module/native/CactusCrypto.js +10 -0
- package/lib/module/native/CactusCrypto.js.map +1 -0
- package/lib/module/native/CactusDeviceInfo.js +13 -0
- package/lib/module/native/CactusDeviceInfo.js.map +1 -0
- package/lib/module/native/CactusFileSystem.js +35 -0
- package/lib/module/native/CactusFileSystem.js.map +1 -0
- package/lib/module/native/CactusUtil.js +23 -0
- package/lib/module/native/CactusUtil.js.map +1 -0
- package/lib/module/native/index.js +8 -0
- package/lib/module/native/index.js.map +1 -0
- package/lib/module/specs/Cactus.nitro.js +4 -0
- package/lib/module/specs/Cactus.nitro.js.map +1 -0
- package/lib/module/specs/CactusCrypto.nitro.js +4 -0
- package/lib/module/specs/CactusCrypto.nitro.js.map +1 -0
- package/lib/module/specs/CactusDeviceInfo.nitro.js +4 -0
- package/lib/module/specs/CactusDeviceInfo.nitro.js.map +1 -0
- package/lib/module/specs/CactusFileSystem.nitro.js +4 -0
- package/lib/module/specs/CactusFileSystem.nitro.js.map +1 -0
- package/lib/module/specs/CactusUtil.nitro.js +4 -0
- package/lib/module/specs/CactusUtil.nitro.js.map +1 -0
- package/lib/module/telemetry/Telemetry.js +100 -0
- package/lib/module/telemetry/Telemetry.js.map +1 -0
- package/lib/module/types/CactusLM.js +2 -0
- package/lib/module/types/CactusLM.js.map +1 -0
- package/lib/module/types/CactusModel.js +2 -0
- package/lib/module/types/CactusModel.js.map +1 -0
- package/lib/module/utils/error.js +4 -0
- package/lib/module/utils/error.js.map +1 -0
- package/lib/typescript/package.json +1 -0
- package/lib/typescript/src/api/Database.d.ts +11 -0
- package/lib/typescript/src/api/Database.d.ts.map +1 -0
- package/lib/typescript/src/classes/CactusLM.d.ts +25 -0
- package/lib/typescript/src/classes/CactusLM.d.ts.map +1 -0
- package/lib/typescript/src/config/CactusConfig.d.ts +5 -0
- package/lib/typescript/src/config/CactusConfig.d.ts.map +1 -0
- package/lib/typescript/src/constants/packageVersion.d.ts +2 -0
- package/lib/typescript/src/constants/packageVersion.d.ts.map +1 -0
- package/lib/typescript/src/hooks/useCactusLM.d.ts +20 -0
- package/lib/typescript/src/hooks/useCactusLM.d.ts.map +1 -0
- package/lib/typescript/src/index.d.ts +6 -0
- package/lib/typescript/src/index.d.ts.map +1 -0
- package/lib/typescript/src/native/Cactus.d.ts +11 -0
- package/lib/typescript/src/native/Cactus.d.ts.map +1 -0
- package/lib/typescript/src/native/CactusCrypto.d.ts +5 -0
- package/lib/typescript/src/native/CactusCrypto.d.ts.map +1 -0
- package/lib/typescript/src/native/CactusDeviceInfo.d.ts +7 -0
- package/lib/typescript/src/native/CactusDeviceInfo.d.ts.map +1 -0
- package/lib/typescript/src/native/CactusFileSystem.d.ts +13 -0
- package/lib/typescript/src/native/CactusFileSystem.d.ts.map +1 -0
- package/lib/typescript/src/native/CactusUtil.d.ts +6 -0
- package/lib/typescript/src/native/CactusUtil.d.ts.map +1 -0
- package/lib/typescript/src/native/index.d.ts +6 -0
- package/lib/typescript/src/native/index.d.ts.map +1 -0
- package/lib/typescript/src/specs/Cactus.nitro.d.ts +13 -0
- package/lib/typescript/src/specs/Cactus.nitro.d.ts.map +1 -0
- package/lib/typescript/src/specs/CactusCrypto.nitro.d.ts +8 -0
- package/lib/typescript/src/specs/CactusCrypto.nitro.d.ts.map +1 -0
- package/lib/typescript/src/specs/CactusDeviceInfo.nitro.d.ts +16 -0
- package/lib/typescript/src/specs/CactusDeviceInfo.nitro.d.ts.map +1 -0
- package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts +16 -0
- package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts.map +1 -0
- package/lib/typescript/src/specs/CactusUtil.nitro.d.ts +10 -0
- package/lib/typescript/src/specs/CactusUtil.nitro.d.ts.map +1 -0
- package/lib/typescript/src/telemetry/Telemetry.d.ts +30 -0
- package/lib/typescript/src/telemetry/Telemetry.d.ts.map +1 -0
- package/lib/typescript/src/types/CactusLM.d.ts +65 -0
- package/lib/typescript/src/types/CactusLM.d.ts.map +1 -0
- package/lib/typescript/src/types/CactusModel.d.ts +12 -0
- package/lib/typescript/src/types/CactusModel.d.ts.map +1 -0
- package/lib/typescript/src/utils/error.d.ts +2 -0
- package/lib/typescript/src/utils/error.d.ts.map +1 -0
- package/nitro.json +31 -0
- package/nitrogen/generated/android/c++/JDeviceInfo.hpp +74 -0
- package/nitrogen/generated/android/c++/JFunc_void_double.hpp +74 -0
- package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.cpp +65 -0
- package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.hpp +65 -0
- package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.cpp +85 -0
- package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.hpp +66 -0
- package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.cpp +192 -0
- package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.hpp +73 -0
- package/nitrogen/generated/android/cactus+autolinking.cmake +87 -0
- package/nitrogen/generated/android/cactus+autolinking.gradle +27 -0
- package/nitrogen/generated/android/cactusOnLoad.cpp +86 -0
- package/nitrogen/generated/android/cactusOnLoad.hpp +25 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/DeviceInfo.kt +50 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/Func_void_double.kt +80 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusCryptoSpec.kt +58 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusDeviceInfoSpec.kt +62 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusFileSystemSpec.kt +95 -0
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/cactusOnLoad.kt +35 -0
- package/nitrogen/generated/ios/Cactus+autolinking.rb +60 -0
- package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.cpp +122 -0
- package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.hpp +373 -0
- package/nitrogen/generated/ios/Cactus-Swift-Cxx-Umbrella.hpp +60 -0
- package/nitrogen/generated/ios/CactusAutolinking.mm +69 -0
- package/nitrogen/generated/ios/CactusAutolinking.swift +55 -0
- package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.cpp +11 -0
- package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.hpp +77 -0
- package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.cpp +11 -0
- package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.hpp +88 -0
- package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.cpp +11 -0
- package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.hpp +143 -0
- package/nitrogen/generated/ios/swift/DeviceInfo.swift +98 -0
- package/nitrogen/generated/ios/swift/Func_void.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_DeviceInfo.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_bool.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_double.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_std__exception_ptr.swift +47 -0
- package/nitrogen/generated/ios/swift/Func_void_std__optional_std__string_.swift +54 -0
- package/nitrogen/generated/ios/swift/Func_void_std__string.swift +47 -0
- package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec.swift +57 -0
- package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec_cxx.swift +139 -0
- package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec.swift +58 -0
- package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec_cxx.swift +164 -0
- package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec.swift +65 -0
- package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec_cxx.swift +303 -0
- package/nitrogen/generated/shared/c++/DeviceInfo.hpp +92 -0
- package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.cpp +21 -0
- package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.hpp +63 -0
- package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.cpp +22 -0
- package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.hpp +67 -0
- package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.cpp +29 -0
- package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.hpp +73 -0
- package/nitrogen/generated/shared/c++/HybridCactusSpec.cpp +26 -0
- package/nitrogen/generated/shared/c++/HybridCactusSpec.hpp +71 -0
- package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.cpp +23 -0
- package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.hpp +66 -0
- package/package.json +84 -143
- package/src/api/Database.ts +83 -0
- package/src/classes/CactusLM.ts +203 -0
- package/src/config/CactusConfig.ts +4 -0
- package/src/constants/packageVersion.ts +1 -0
- package/src/hooks/useCactusLM.ts +282 -0
- package/src/index.tsx +23 -0
- package/src/native/Cactus.ts +79 -0
- package/src/native/CactusCrypto.ts +11 -0
- package/src/native/CactusDeviceInfo.ts +18 -0
- package/src/native/CactusFileSystem.ts +47 -0
- package/src/native/CactusUtil.ts +27 -0
- package/src/native/index.ts +5 -0
- package/src/specs/Cactus.nitro.ts +16 -0
- package/src/specs/CactusCrypto.nitro.ts +6 -0
- package/src/specs/CactusDeviceInfo.nitro.ts +15 -0
- package/src/specs/CactusFileSystem.nitro.ts +21 -0
- package/src/specs/CactusUtil.nitro.ts +8 -0
- package/src/telemetry/Telemetry.ts +159 -0
- package/src/types/CactusLM.ts +71 -0
- package/src/types/CactusModel.ts +14 -0
- package/src/utils/error.ts +2 -0
- package/LICENSE.txt +0 -20
- package/android/src/main/CMakeLists.txt +0 -139
- package/android/src/main/java/com/cactus/Cactus.java +0 -1190
- package/android/src/main/java/com/cactus/CactusPackage.java +0 -48
- package/android/src/main/java/com/cactus/LlamaContext.java +0 -814
- package/android/src/main/jni-utils.h +0 -100
- package/android/src/main/jni.cpp +0 -1605
- package/android/src/main/jniLibs/arm64-v8a/libcactus_v8.so +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2.so +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_dotprod.so +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_dotprod_i8mm.so +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_v8_2_i8mm.so +0 -0
- package/android/src/newarch/java/com/cactus/CactusModule.java +0 -206
- package/android/src/oldarch/java/com/cactus/CactusModule.java +0 -205
- package/cactus-react-native.podspec +0 -42
- package/ios/CMakeLists.txt +0 -131
- package/ios/Cactus.h +0 -6
- package/ios/Cactus.mm +0 -681
- package/ios/CactusContext.h +0 -81
- package/ios/CactusContext.mm +0 -1032
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/chat.h +0 -145
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/common.h +0 -674
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-alloc.h +0 -76
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-backend-impl.h +0 -255
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-backend.h +0 -354
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-common.h +0 -1857
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-cpp.h +0 -39
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-cpu.h +0 -143
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-impl.h +0 -601
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-metal-impl.h +0 -622
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-metal.h +0 -66
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-opt.h +0 -237
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-quants.h +0 -100
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml-threading.h +0 -14
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/ggml.h +0 -2202
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/gguf.h +0 -202
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/json.hpp +0 -24766
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-adapter.h +0 -76
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-arch.h +0 -437
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-batch.h +0 -89
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-chat.h +0 -58
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-context.h +0 -276
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-cparams.h +0 -39
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-cpp.h +0 -30
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-grammar.h +0 -173
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-graph.h +0 -640
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-hparams.h +0 -190
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-impl.h +0 -61
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-io.h +0 -35
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-kv-cache.h +0 -515
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-memory.h +0 -32
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-mmap.h +0 -68
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model-loader.h +0 -169
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model-saver.h +0 -37
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-model.h +0 -425
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-sampling.h +0 -32
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama-vocab.h +0 -131
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/llama.h +0 -1376
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/log.h +0 -103
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/minja/chat-template.hpp +0 -542
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/minja/minja.hpp +0 -2974
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/sampling.h +0 -107
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/unicode-data.h +0 -20
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/unicode.h +0 -66
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/ggml-llama.metallib +0 -0
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/cactus.h +0 -232
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/cactus_ffi.h +0 -256
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/chat.h +0 -145
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/common.h +0 -674
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-alloc.h +0 -76
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend-impl.h +0 -255
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend.h +0 -354
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-common.h +0 -1857
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpp.h +0 -39
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpu.h +0 -143
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-impl.h +0 -601
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal-impl.h +0 -622
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal.h +0 -66
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-opt.h +0 -237
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-quants.h +0 -100
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml-threading.h +0 -14
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/ggml.h +0 -2202
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/gguf.h +0 -202
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/json.hpp +0 -24766
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-adapter.h +0 -76
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-arch.h +0 -437
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-batch.h +0 -89
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-chat.h +0 -58
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-context.h +0 -276
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-cparams.h +0 -39
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-cpp.h +0 -30
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-grammar.h +0 -173
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-graph.h +0 -640
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-hparams.h +0 -190
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-impl.h +0 -61
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-io.h +0 -35
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-kv-cache.h +0 -515
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-memory.h +0 -32
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-mmap.h +0 -68
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-loader.h +0 -169
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-saver.h +0 -37
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-model.h +0 -425
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-sampling.h +0 -32
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama-vocab.h +0 -131
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/llama.h +0 -1376
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/log.h +0 -103
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/minja/chat-template.hpp +0 -542
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/minja/minja.hpp +0 -2974
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/sampling.h +0 -107
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/unicode-data.h +0 -20
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/Headers/unicode.h +0 -66
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/cactus +0 -0
- package/ios/cactus.xcframework/ios-arm64_x86_64-simulator/cactus.framework/ggml-llama-sim.metallib +0 -0
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/cactus.h +0 -232
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/cactus_ffi.h +0 -256
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/chat.h +0 -145
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/common.h +0 -674
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-alloc.h +0 -76
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-backend-impl.h +0 -255
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-backend.h +0 -354
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-common.h +0 -1857
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-cpp.h +0 -39
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-cpu.h +0 -143
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-impl.h +0 -601
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-metal-impl.h +0 -622
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-metal.h +0 -66
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-opt.h +0 -237
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-quants.h +0 -100
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml-threading.h +0 -14
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/ggml.h +0 -2202
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/gguf.h +0 -202
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/json.hpp +0 -24766
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-adapter.h +0 -76
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-arch.h +0 -437
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-batch.h +0 -89
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-chat.h +0 -58
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-context.h +0 -276
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-cparams.h +0 -39
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-cpp.h +0 -30
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-grammar.h +0 -173
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-graph.h +0 -640
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-hparams.h +0 -190
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-impl.h +0 -61
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-io.h +0 -35
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-kv-cache.h +0 -515
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-memory.h +0 -32
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-mmap.h +0 -68
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model-loader.h +0 -169
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model-saver.h +0 -37
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-model.h +0 -425
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-sampling.h +0 -32
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama-vocab.h +0 -131
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/llama.h +0 -1376
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/log.h +0 -103
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/minja/chat-template.hpp +0 -542
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/minja/minja.hpp +0 -2974
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/sampling.h +0 -107
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/unicode-data.h +0 -20
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Headers/unicode.h +0 -66
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/cactus +0 -0
- package/ios/cactus.xcframework/tvos-arm64/cactus.framework/ggml-llama.metallib +0 -0
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/cactus.h +0 -232
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/cactus_ffi.h +0 -256
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/chat.h +0 -145
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/common.h +0 -674
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-alloc.h +0 -76
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend-impl.h +0 -255
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-backend.h +0 -354
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-common.h +0 -1857
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpp.h +0 -39
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-cpu.h +0 -143
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-impl.h +0 -601
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal-impl.h +0 -622
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-metal.h +0 -66
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-opt.h +0 -237
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-quants.h +0 -100
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml-threading.h +0 -14
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/ggml.h +0 -2202
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/gguf.h +0 -202
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/json-schema-to-grammar.h +0 -21
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/json.hpp +0 -24766
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-adapter.h +0 -76
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-arch.h +0 -437
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-batch.h +0 -89
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-chat.h +0 -58
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-context.h +0 -276
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-cparams.h +0 -39
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-cpp.h +0 -30
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-grammar.h +0 -173
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-graph.h +0 -640
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-hparams.h +0 -190
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-impl.h +0 -61
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-io.h +0 -35
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-kv-cache.h +0 -515
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-memory.h +0 -32
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-mmap.h +0 -68
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-loader.h +0 -169
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model-saver.h +0 -37
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-model.h +0 -425
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-sampling.h +0 -32
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama-vocab.h +0 -131
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/llama.h +0 -1376
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/log.h +0 -103
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/minja/chat-template.hpp +0 -542
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/minja/minja.hpp +0 -2974
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/sampling.h +0 -107
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/unicode-data.h +0 -20
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Headers/unicode.h +0 -66
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/cactus +0 -0
- package/ios/cactus.xcframework/tvos-arm64_x86_64-simulator/cactus.framework/ggml-llama-sim.metallib +0 -0
- package/lib/commonjs/NativeCactus.js +0 -9
- package/lib/commonjs/NativeCactus.js.map +0 -1
- package/lib/commonjs/agent.js +0 -73
- package/lib/commonjs/agent.js.map +0 -1
- package/lib/commonjs/chat.js +0 -73
- package/lib/commonjs/chat.js.map +0 -1
- package/lib/commonjs/index.js +0 -523
- package/lib/commonjs/index.js.map +0 -1
- package/lib/commonjs/lm.js +0 -272
- package/lib/commonjs/lm.js.map +0 -1
- package/lib/commonjs/package.json +0 -1
- package/lib/commonjs/projectId.js +0 -8
- package/lib/commonjs/projectId.js.map +0 -1
- package/lib/commonjs/remote.js +0 -100
- package/lib/commonjs/remote.js.map +0 -1
- package/lib/commonjs/telemetry.js +0 -102
- package/lib/commonjs/telemetry.js.map +0 -1
- package/lib/commonjs/tools.js +0 -72
- package/lib/commonjs/tools.js.map +0 -1
- package/lib/commonjs/tts.js +0 -29
- package/lib/commonjs/tts.js.map +0 -1
- package/lib/commonjs/vlm.js +0 -221
- package/lib/commonjs/vlm.js.map +0 -1
- package/lib/module/NativeCactus.js +0 -5
- package/lib/module/NativeCactus.js.map +0 -1
- package/lib/module/agent.js +0 -68
- package/lib/module/agent.js.map +0 -1
- package/lib/module/chat.js +0 -67
- package/lib/module/chat.js.map +0 -1
- package/lib/module/lm.js +0 -267
- package/lib/module/lm.js.map +0 -1
- package/lib/module/projectId.js +0 -4
- package/lib/module/projectId.js.map +0 -1
- package/lib/module/remote.js +0 -91
- package/lib/module/remote.js.map +0 -1
- package/lib/module/telemetry.js +0 -97
- package/lib/module/telemetry.js.map +0 -1
- package/lib/module/tools.js +0 -66
- package/lib/module/tools.js.map +0 -1
- package/lib/module/tts.js +0 -24
- package/lib/module/tts.js.map +0 -1
- package/lib/module/vlm.js +0 -216
- package/lib/module/vlm.js.map +0 -1
- package/lib/typescript/NativeCactus.d.ts +0 -252
- package/lib/typescript/NativeCactus.d.ts.map +0 -1
- package/lib/typescript/agent.d.ts +0 -31
- package/lib/typescript/agent.d.ts.map +0 -1
- package/lib/typescript/chat.d.ts +0 -23
- package/lib/typescript/chat.d.ts.map +0 -1
- package/lib/typescript/index.d.ts +0 -114
- package/lib/typescript/index.d.ts.map +0 -1
- package/lib/typescript/lm.d.ts +0 -36
- package/lib/typescript/lm.d.ts.map +0 -1
- package/lib/typescript/projectId.d.ts +0 -2
- package/lib/typescript/projectId.d.ts.map +0 -1
- package/lib/typescript/remote.d.ts +0 -8
- package/lib/typescript/remote.d.ts.map +0 -1
- package/lib/typescript/telemetry.d.ts +0 -25
- package/lib/typescript/telemetry.d.ts.map +0 -1
- package/lib/typescript/tools.d.ts +0 -36
- package/lib/typescript/tools.d.ts.map +0 -1
- package/lib/typescript/tts.d.ts +0 -10
- package/lib/typescript/tts.d.ts.map +0 -1
- package/lib/typescript/vlm.d.ts +0 -33
- package/lib/typescript/vlm.d.ts.map +0 -1
- package/scripts/postInstall.js +0 -33
- package/src/NativeCactus.ts +0 -317
- package/src/agent.ts +0 -112
- package/src/chat.ts +0 -91
- package/src/index.ts +0 -662
- package/src/lm.ts +0 -324
- package/src/projectId.ts +0 -1
- package/src/remote.ts +0 -113
- package/src/telemetry.ts +0 -137
- package/src/tools.ts +0 -94
- package/src/tts.ts +0 -42
- package/src/vlm.ts +0 -276
|
@@ -1,103 +0,0 @@
|
|
|
1
|
-
#pragma once
|
|
2
|
-
|
|
3
|
-
#include "ggml.h" // for lm_ggml_log_level
|
|
4
|
-
|
|
5
|
-
#define LOG_CLR_TO_EOL "\033[K\r"
|
|
6
|
-
#define LOG_COL_DEFAULT "\033[0m"
|
|
7
|
-
#define LOG_COL_BOLD "\033[1m"
|
|
8
|
-
#define LOG_COL_RED "\033[31m"
|
|
9
|
-
#define LOG_COL_GREEN "\033[32m"
|
|
10
|
-
#define LOG_COL_YELLOW "\033[33m"
|
|
11
|
-
#define LOG_COL_BLUE "\033[34m"
|
|
12
|
-
#define LOG_COL_MAGENTA "\033[35m"
|
|
13
|
-
#define LOG_COL_CYAN "\033[36m"
|
|
14
|
-
#define LOG_COL_WHITE "\033[37m"
|
|
15
|
-
|
|
16
|
-
#ifndef __GNUC__
|
|
17
|
-
# define LOG_ATTRIBUTE_FORMAT(...)
|
|
18
|
-
#elif defined(__MINGW32__) && !defined(__clang__)
|
|
19
|
-
# define LOG_ATTRIBUTE_FORMAT(...) __attribute__((format(gnu_printf, __VA_ARGS__)))
|
|
20
|
-
#else
|
|
21
|
-
# define LOG_ATTRIBUTE_FORMAT(...) __attribute__((format(printf, __VA_ARGS__)))
|
|
22
|
-
#endif
|
|
23
|
-
|
|
24
|
-
#define LOG_DEFAULT_DEBUG 1
|
|
25
|
-
#define LOG_DEFAULT_LLAMA 0
|
|
26
|
-
|
|
27
|
-
// needed by the LOG_TMPL macro to avoid computing log arguments if the verbosity lower
|
|
28
|
-
// set via common_log_set_verbosity()
|
|
29
|
-
extern int common_log_verbosity_thold;
|
|
30
|
-
|
|
31
|
-
void common_log_set_verbosity_thold(int verbosity); // not thread-safe
|
|
32
|
-
|
|
33
|
-
// the common_log uses an internal worker thread to print/write log messages
|
|
34
|
-
// when the worker thread is paused, incoming log messages are discarded
|
|
35
|
-
struct common_log;
|
|
36
|
-
|
|
37
|
-
struct common_log * common_log_init();
|
|
38
|
-
struct common_log * common_log_main(); // singleton, automatically destroys itself on exit
|
|
39
|
-
void common_log_pause (struct common_log * log); // pause the worker thread, not thread-safe
|
|
40
|
-
void common_log_resume(struct common_log * log); // resume the worker thread, not thread-safe
|
|
41
|
-
void common_log_free (struct common_log * log);
|
|
42
|
-
|
|
43
|
-
LOG_ATTRIBUTE_FORMAT(3, 4)
|
|
44
|
-
void common_log_add(struct common_log * log, enum lm_ggml_log_level level, const char * fmt, ...);
|
|
45
|
-
|
|
46
|
-
// defaults: file = NULL, colors = false, prefix = false, timestamps = false
|
|
47
|
-
//
|
|
48
|
-
// regular log output:
|
|
49
|
-
//
|
|
50
|
-
// lm_ggml_backend_metal_log_allocated_size: allocated buffer, size = 6695.84 MiB, ( 6695.91 / 21845.34)
|
|
51
|
-
// llm_load_tensors: ggml ctx size = 0.27 MiB
|
|
52
|
-
// llm_load_tensors: offloading 32 repeating layers to GPU
|
|
53
|
-
// llm_load_tensors: offloading non-repeating layers to GPU
|
|
54
|
-
//
|
|
55
|
-
// with prefix = true, timestamps = true, the log output will look like this:
|
|
56
|
-
//
|
|
57
|
-
// 0.00.035.060 D lm_ggml_backend_metal_log_allocated_size: allocated buffer, size = 6695.84 MiB, ( 6695.91 / 21845.34)
|
|
58
|
-
// 0.00.035.064 I llm_load_tensors: ggml ctx size = 0.27 MiB
|
|
59
|
-
// 0.00.090.578 I llm_load_tensors: offloading 32 repeating layers to GPU
|
|
60
|
-
// 0.00.090.579 I llm_load_tensors: offloading non-repeating layers to GPU
|
|
61
|
-
//
|
|
62
|
-
// I - info (stdout, V = 0)
|
|
63
|
-
// W - warning (stderr, V = 0)
|
|
64
|
-
// E - error (stderr, V = 0)
|
|
65
|
-
// D - debug (stderr, V = LOG_DEFAULT_DEBUG)
|
|
66
|
-
//
|
|
67
|
-
|
|
68
|
-
void common_log_set_file (struct common_log * log, const char * file); // not thread-safe
|
|
69
|
-
void common_log_set_colors (struct common_log * log, bool colors); // not thread-safe
|
|
70
|
-
void common_log_set_prefix (struct common_log * log, bool prefix); // whether to output prefix to each log
|
|
71
|
-
void common_log_set_timestamps(struct common_log * log, bool timestamps); // whether to output timestamps in the prefix
|
|
72
|
-
|
|
73
|
-
// helper macros for logging
|
|
74
|
-
// use these to avoid computing log arguments if the verbosity of the log is higher than the threshold
|
|
75
|
-
//
|
|
76
|
-
// for example:
|
|
77
|
-
//
|
|
78
|
-
// LOG_DBG("this is a debug message: %d\n", expensive_function());
|
|
79
|
-
//
|
|
80
|
-
// this will avoid calling expensive_function() if LOG_DEFAULT_DEBUG > common_log_verbosity_thold
|
|
81
|
-
//
|
|
82
|
-
|
|
83
|
-
#define LOG_TMPL(level, verbosity, ...) \
|
|
84
|
-
do { \
|
|
85
|
-
if ((verbosity) <= common_log_verbosity_thold) { \
|
|
86
|
-
common_log_add(common_log_main(), (level), __VA_ARGS__); \
|
|
87
|
-
} \
|
|
88
|
-
} while (0)
|
|
89
|
-
|
|
90
|
-
#define LOG(...) LOG_TMPL(LM_GGML_LOG_LEVEL_NONE, 0, __VA_ARGS__)
|
|
91
|
-
#define LOGV(verbosity, ...) LOG_TMPL(LM_GGML_LOG_LEVEL_NONE, verbosity, __VA_ARGS__)
|
|
92
|
-
|
|
93
|
-
#define LOG_INF(...) LOG_TMPL(LM_GGML_LOG_LEVEL_INFO, 0, __VA_ARGS__)
|
|
94
|
-
#define LOG_WRN(...) LOG_TMPL(LM_GGML_LOG_LEVEL_WARN, 0, __VA_ARGS__)
|
|
95
|
-
#define LOG_ERR(...) LOG_TMPL(LM_GGML_LOG_LEVEL_ERROR, 0, __VA_ARGS__)
|
|
96
|
-
#define LOG_DBG(...) LOG_TMPL(LM_GGML_LOG_LEVEL_DEBUG, LOG_DEFAULT_DEBUG, __VA_ARGS__)
|
|
97
|
-
#define LOG_CNT(...) LOG_TMPL(LM_GGML_LOG_LEVEL_CONT, 0, __VA_ARGS__)
|
|
98
|
-
|
|
99
|
-
#define LOG_INFV(verbosity, ...) LOG_TMPL(LM_GGML_LOG_LEVEL_INFO, verbosity, __VA_ARGS__)
|
|
100
|
-
#define LOG_WRNV(verbosity, ...) LOG_TMPL(LM_GGML_LOG_LEVEL_WARN, verbosity, __VA_ARGS__)
|
|
101
|
-
#define LOG_ERRV(verbosity, ...) LOG_TMPL(LM_GGML_LOG_LEVEL_ERROR, verbosity, __VA_ARGS__)
|
|
102
|
-
#define LOG_DBGV(verbosity, ...) LOG_TMPL(LM_GGML_LOG_LEVEL_DEBUG, verbosity, __VA_ARGS__)
|
|
103
|
-
#define LOG_CNTV(verbosity, ...) LOG_TMPL(LM_GGML_LOG_LEVEL_CONT, verbosity, __VA_ARGS__)
|
|
@@ -1,542 +0,0 @@
|
|
|
1
|
-
/*
|
|
2
|
-
Copyright 2024 Google LLC
|
|
3
|
-
|
|
4
|
-
Use of this source code is governed by an MIT-style
|
|
5
|
-
license that can be found in the LICENSE file or at
|
|
6
|
-
https://opensource.org/licenses/MIT.
|
|
7
|
-
*/
|
|
8
|
-
// SPDX-License-Identifier: MIT
|
|
9
|
-
#pragma once
|
|
10
|
-
|
|
11
|
-
#include "minja.hpp"
|
|
12
|
-
|
|
13
|
-
#include <chrono>
|
|
14
|
-
#include <cstddef>
|
|
15
|
-
#include <cstdio>
|
|
16
|
-
#include <ctime>
|
|
17
|
-
#include <exception>
|
|
18
|
-
#include <iomanip>
|
|
19
|
-
#include <memory>
|
|
20
|
-
#include <sstream>
|
|
21
|
-
#include <stdexcept>
|
|
22
|
-
#include <string>
|
|
23
|
-
#include <vector>
|
|
24
|
-
|
|
25
|
-
#include "../json.hpp"
|
|
26
|
-
|
|
27
|
-
using json = nlohmann::ordered_json;
|
|
28
|
-
|
|
29
|
-
namespace minja {
|
|
30
|
-
|
|
31
|
-
struct chat_template_caps {
|
|
32
|
-
bool supports_tools = false;
|
|
33
|
-
bool supports_tool_calls = false;
|
|
34
|
-
bool supports_tool_responses = false;
|
|
35
|
-
bool supports_system_role = false;
|
|
36
|
-
bool supports_parallel_tool_calls = false;
|
|
37
|
-
bool supports_tool_call_id = false;
|
|
38
|
-
// meta-llama/Llama-3.1-8B-Instruct expects arguments to be an object.
|
|
39
|
-
// Most other templates (and OpenAI's API) expect the arguments object to be stringified.
|
|
40
|
-
bool requires_object_arguments = false;
|
|
41
|
-
// CohereForAI/c4ai-command-r-plus simple variant
|
|
42
|
-
bool requires_non_null_content = false;
|
|
43
|
-
// MiniMaxAI/MiniMax-Text-01 special
|
|
44
|
-
bool requires_typed_content = false;
|
|
45
|
-
};
|
|
46
|
-
|
|
47
|
-
struct chat_template_inputs {
|
|
48
|
-
nlohmann::ordered_json messages;
|
|
49
|
-
nlohmann::ordered_json tools;
|
|
50
|
-
bool add_generation_prompt = true;
|
|
51
|
-
nlohmann::ordered_json extra_context;
|
|
52
|
-
std::chrono::system_clock::time_point now = std::chrono::system_clock::now();
|
|
53
|
-
};
|
|
54
|
-
|
|
55
|
-
struct chat_template_options {
|
|
56
|
-
bool apply_polyfills = true;
|
|
57
|
-
bool use_bos_token = true;
|
|
58
|
-
bool use_eos_token = true;
|
|
59
|
-
bool define_strftime_now = true;
|
|
60
|
-
|
|
61
|
-
bool polyfill_tools = true;
|
|
62
|
-
bool polyfill_tool_call_examples = true;
|
|
63
|
-
bool polyfill_tool_calls = true;
|
|
64
|
-
bool polyfill_tool_responses = true;
|
|
65
|
-
bool polyfill_system_role = true;
|
|
66
|
-
bool polyfill_object_arguments = true;
|
|
67
|
-
bool polyfill_typed_content = true;
|
|
68
|
-
};
|
|
69
|
-
|
|
70
|
-
class chat_template {
|
|
71
|
-
|
|
72
|
-
private:
|
|
73
|
-
chat_template_caps caps_;
|
|
74
|
-
std::string source_;
|
|
75
|
-
std::string bos_token_;
|
|
76
|
-
std::string eos_token_;
|
|
77
|
-
std::shared_ptr<minja::TemplateNode> template_root_;
|
|
78
|
-
std::string tool_call_example_;
|
|
79
|
-
|
|
80
|
-
std::string try_raw_render(
|
|
81
|
-
const nlohmann::ordered_json & messages,
|
|
82
|
-
const nlohmann::ordered_json & tools,
|
|
83
|
-
bool add_generation_prompt,
|
|
84
|
-
const nlohmann::ordered_json & extra_context = nlohmann::ordered_json()) const
|
|
85
|
-
{
|
|
86
|
-
try {
|
|
87
|
-
chat_template_inputs inputs;
|
|
88
|
-
inputs.messages = messages;
|
|
89
|
-
inputs.tools = tools;
|
|
90
|
-
inputs.add_generation_prompt = add_generation_prompt;
|
|
91
|
-
inputs.extra_context = extra_context;
|
|
92
|
-
// Use fixed date for tests
|
|
93
|
-
inputs.now = std::chrono::system_clock::from_time_t(0);
|
|
94
|
-
|
|
95
|
-
chat_template_options opts;
|
|
96
|
-
opts.apply_polyfills = false;
|
|
97
|
-
|
|
98
|
-
auto prompt = apply(inputs, opts);
|
|
99
|
-
// fprintf(stderr, "try_raw_render: %s\n", prompt.c_str());
|
|
100
|
-
return prompt;
|
|
101
|
-
} catch (const std::exception & e) {
|
|
102
|
-
(void)e; // Suppress unused variable warning in MSVC builds.
|
|
103
|
-
// fprintf(stderr, "try_raw_render error: %s\n", e.what());
|
|
104
|
-
return "";
|
|
105
|
-
}
|
|
106
|
-
}
|
|
107
|
-
|
|
108
|
-
public:
|
|
109
|
-
|
|
110
|
-
chat_template(const std::string & source, const std::string & bos_token, const std::string & eos_token)
|
|
111
|
-
: source_(source), bos_token_(bos_token), eos_token_(eos_token)
|
|
112
|
-
{
|
|
113
|
-
template_root_ = minja::Parser::parse(source_, {
|
|
114
|
-
/* .trim_blocks = */ true,
|
|
115
|
-
/* .lstrip_blocks = */ true,
|
|
116
|
-
/* .keep_trailing_newline = */ false,
|
|
117
|
-
});
|
|
118
|
-
|
|
119
|
-
auto contains = [](const std::string & haystack, const std::string & needle) {
|
|
120
|
-
return haystack.find(needle) != std::string::npos;
|
|
121
|
-
};
|
|
122
|
-
|
|
123
|
-
const std::string user_needle = "<User Needle>";
|
|
124
|
-
const std::string sys_needle = "<System Needle>";
|
|
125
|
-
const json dummy_str_user_msg = {{"role", "user"}, {"content", user_needle}};
|
|
126
|
-
const json dummy_typed_user_msg = {{"role", "user"}, {"content", json::array({{{"type", "text"}, {"text", user_needle}}})}};
|
|
127
|
-
|
|
128
|
-
caps_.requires_typed_content =
|
|
129
|
-
!contains(try_raw_render(json::array({dummy_str_user_msg}), {}, false), user_needle)
|
|
130
|
-
&& contains(try_raw_render(json::array({dummy_typed_user_msg}), {}, false), user_needle);
|
|
131
|
-
|
|
132
|
-
const auto dummy_user_msg = caps_.requires_typed_content
|
|
133
|
-
? dummy_typed_user_msg
|
|
134
|
-
: dummy_str_user_msg;
|
|
135
|
-
const json needle_system_msg = {
|
|
136
|
-
{"role", "system"},
|
|
137
|
-
{"content", caps_.requires_typed_content ? json::array({{{"type", "text"}, {"text", sys_needle}}}) : json(sys_needle)},
|
|
138
|
-
};
|
|
139
|
-
|
|
140
|
-
caps_.supports_system_role = contains(try_raw_render({needle_system_msg, dummy_user_msg,}, {}, false), sys_needle);
|
|
141
|
-
|
|
142
|
-
auto out = try_raw_render(json::array({
|
|
143
|
-
dummy_user_msg
|
|
144
|
-
}), json::array({
|
|
145
|
-
{
|
|
146
|
-
{"name", "some_tool"},
|
|
147
|
-
{"type", "function"},
|
|
148
|
-
{"function", {
|
|
149
|
-
{"name", "some_tool"},
|
|
150
|
-
{"description", "Some tool."},
|
|
151
|
-
{"parameters", {
|
|
152
|
-
{"type", "object"},
|
|
153
|
-
{"properties", {
|
|
154
|
-
{"arg", {
|
|
155
|
-
{"type", "string"},
|
|
156
|
-
{"description", "Some argument."},
|
|
157
|
-
}},
|
|
158
|
-
}},
|
|
159
|
-
{"required", json::array({ "arg" })},
|
|
160
|
-
}},
|
|
161
|
-
}},
|
|
162
|
-
},
|
|
163
|
-
}), false);
|
|
164
|
-
caps_.supports_tools = contains(out, "some_tool");
|
|
165
|
-
|
|
166
|
-
auto make_tool_calls_msg = [&](const json & tool_calls) {
|
|
167
|
-
return json {
|
|
168
|
-
{"role", "assistant"},
|
|
169
|
-
{"content", nullptr},
|
|
170
|
-
{"tool_calls", tool_calls},
|
|
171
|
-
};
|
|
172
|
-
};
|
|
173
|
-
auto make_tool_call = [](const std::string & tool_name, const json & arguments) {
|
|
174
|
-
return json {
|
|
175
|
-
{"id", "call_1___"},
|
|
176
|
-
{"type", "function"},
|
|
177
|
-
{"function", {
|
|
178
|
-
{"arguments", arguments},
|
|
179
|
-
{"name", tool_name},
|
|
180
|
-
}},
|
|
181
|
-
};
|
|
182
|
-
};
|
|
183
|
-
const json dummy_args_obj {{"argument_needle", "print('Hello, World!')"}};
|
|
184
|
-
|
|
185
|
-
// Note: the arguments are rendered in both cases, but may be double-escaped, which we don't want.
|
|
186
|
-
out = try_raw_render(json::array({
|
|
187
|
-
dummy_user_msg,
|
|
188
|
-
make_tool_calls_msg(json::array({make_tool_call("ipython", dummy_args_obj.dump())})),
|
|
189
|
-
}), {}, false);
|
|
190
|
-
auto tool_call_renders_str_arguments = contains(out, "\"argument_needle\":") || contains(out, "'argument_needle':");
|
|
191
|
-
out = try_raw_render(json::array({
|
|
192
|
-
dummy_user_msg,
|
|
193
|
-
make_tool_calls_msg(json::array({make_tool_call("ipython", dummy_args_obj)})),
|
|
194
|
-
}), {}, false);
|
|
195
|
-
auto tool_call_renders_obj_arguments = contains(out, "\"argument_needle\":") || contains(out, "'argument_needle':");
|
|
196
|
-
|
|
197
|
-
caps_.supports_tool_calls = tool_call_renders_str_arguments || tool_call_renders_obj_arguments;
|
|
198
|
-
caps_.requires_object_arguments = !tool_call_renders_str_arguments && tool_call_renders_obj_arguments;
|
|
199
|
-
auto out_empty = try_raw_render(json::array({dummy_user_msg, {{"role", "assistant"}, {"content", ""}}}), {}, false);
|
|
200
|
-
auto out_null = try_raw_render(json::array({dummy_user_msg, {{"role", "assistant"}, {"content", nullptr}}}), {}, false);
|
|
201
|
-
caps_.requires_non_null_content = contains(out_empty, user_needle) && !contains(out_null, user_needle);
|
|
202
|
-
|
|
203
|
-
if (caps_.supports_tool_calls) {
|
|
204
|
-
auto dummy_args = caps_.requires_object_arguments ? dummy_args_obj : json(dummy_args_obj.dump());
|
|
205
|
-
auto tc1 = make_tool_call("test_tool1", dummy_args);
|
|
206
|
-
auto tc2 = make_tool_call("test_tool2", dummy_args);
|
|
207
|
-
auto out = try_raw_render(json::array({
|
|
208
|
-
dummy_user_msg,
|
|
209
|
-
make_tool_calls_msg(json::array({tc1, tc2})),
|
|
210
|
-
}), {}, false);
|
|
211
|
-
caps_.supports_parallel_tool_calls = contains(out, "test_tool1") && contains(out, "test_tool2");
|
|
212
|
-
|
|
213
|
-
out = try_raw_render(json::array({
|
|
214
|
-
dummy_user_msg,
|
|
215
|
-
make_tool_calls_msg(json::array({tc1})),
|
|
216
|
-
{
|
|
217
|
-
{"role", "tool"},
|
|
218
|
-
{"name", "test_tool1"},
|
|
219
|
-
{"content", "Some response!"},
|
|
220
|
-
{"tool_call_id", "call_911_"},
|
|
221
|
-
}
|
|
222
|
-
}), {}, false);
|
|
223
|
-
caps_.supports_tool_responses = contains(out, "Some response!");
|
|
224
|
-
caps_.supports_tool_call_id = contains(out, "call_911_");
|
|
225
|
-
}
|
|
226
|
-
|
|
227
|
-
try {
|
|
228
|
-
if (!caps_.supports_tools) {
|
|
229
|
-
const json user_msg {
|
|
230
|
-
{"role", "user"},
|
|
231
|
-
{"content", "Hey"},
|
|
232
|
-
};
|
|
233
|
-
const json args {
|
|
234
|
-
{"arg1", "some_value"},
|
|
235
|
-
};
|
|
236
|
-
const json tool_call_msg {
|
|
237
|
-
{"role", "assistant"},
|
|
238
|
-
{"content", nullptr},
|
|
239
|
-
{"tool_calls", json::array({
|
|
240
|
-
{
|
|
241
|
-
// TODO: detect if requires numerical id or fixed length == 6 like Nemo
|
|
242
|
-
{"id", "call_1___"},
|
|
243
|
-
{"type", "function"},
|
|
244
|
-
{"function", {
|
|
245
|
-
{"name", "tool_name"},
|
|
246
|
-
{"arguments", (caps_.requires_object_arguments ? args : json(minja::Value(args).dump(-1, /* to_json= */ true)))},
|
|
247
|
-
}},
|
|
248
|
-
},
|
|
249
|
-
})},
|
|
250
|
-
};
|
|
251
|
-
std::string prefix, full;
|
|
252
|
-
{
|
|
253
|
-
chat_template_inputs inputs;
|
|
254
|
-
inputs.messages = json::array({user_msg});
|
|
255
|
-
inputs.add_generation_prompt = true;
|
|
256
|
-
prefix = apply(inputs);
|
|
257
|
-
}
|
|
258
|
-
{
|
|
259
|
-
chat_template_inputs inputs;
|
|
260
|
-
inputs.messages = json::array({user_msg, tool_call_msg});
|
|
261
|
-
inputs.add_generation_prompt = false;
|
|
262
|
-
full = apply(inputs);
|
|
263
|
-
}
|
|
264
|
-
auto eos_pos_last = full.rfind(eos_token_);
|
|
265
|
-
if (eos_pos_last == prefix.size() - eos_token_.size() ||
|
|
266
|
-
(full[full.size() - 1] == '\n' && (eos_pos_last == full.size() - eos_token_.size() - 1))) {
|
|
267
|
-
full = full.substr(0, eos_pos_last);
|
|
268
|
-
}
|
|
269
|
-
size_t common_prefix_length = 0;
|
|
270
|
-
for (size_t i = 0; i < prefix.size() && i < full.size(); ++i) {
|
|
271
|
-
if (prefix[i] != full[i]) {
|
|
272
|
-
break;
|
|
273
|
-
}
|
|
274
|
-
if (prefix[i] == '<') {
|
|
275
|
-
// DeepSeek R1's template (as of 20250209) adds a trailing <think> if add_generation_prompt,
|
|
276
|
-
// but it removes thinking tags for past messages.
|
|
277
|
-
// The prefix and full strings diverge at <think> vs. <|tool▁calls▁begin|>, we avoid consuming the leading <.
|
|
278
|
-
continue;
|
|
279
|
-
}
|
|
280
|
-
common_prefix_length = i + 1;
|
|
281
|
-
}
|
|
282
|
-
auto example = full.substr(common_prefix_length);
|
|
283
|
-
if (example.find("tool_name") == std::string::npos && example.find("some_value") == std::string::npos) {
|
|
284
|
-
fprintf(stderr, "Failed to infer a tool call example (possible template bug)\n");
|
|
285
|
-
} else {
|
|
286
|
-
tool_call_example_ = example;
|
|
287
|
-
}
|
|
288
|
-
}
|
|
289
|
-
} catch (const std::exception & e) {
|
|
290
|
-
fprintf(stderr, "Failed to generate tool call example: %s\n", e.what());
|
|
291
|
-
}
|
|
292
|
-
}
|
|
293
|
-
|
|
294
|
-
const std::string & source() const { return source_; }
|
|
295
|
-
const std::string & bos_token() const { return bos_token_; }
|
|
296
|
-
const std::string & eos_token() const { return eos_token_; }
|
|
297
|
-
const chat_template_caps & original_caps() const { return caps_; }
|
|
298
|
-
|
|
299
|
-
// Deprecated, please use the form with chat_template_inputs and chat_template_options
|
|
300
|
-
std::string apply(
|
|
301
|
-
const nlohmann::ordered_json & messages,
|
|
302
|
-
const nlohmann::ordered_json & tools,
|
|
303
|
-
bool add_generation_prompt,
|
|
304
|
-
const nlohmann::ordered_json & extra_context = nlohmann::ordered_json(),
|
|
305
|
-
bool apply_polyfills = true)
|
|
306
|
-
{
|
|
307
|
-
fprintf(stderr, "[%s] Deprecated!\n", __func__);
|
|
308
|
-
chat_template_inputs inputs;
|
|
309
|
-
inputs.messages = messages;
|
|
310
|
-
inputs.tools = tools;
|
|
311
|
-
inputs.add_generation_prompt = add_generation_prompt;
|
|
312
|
-
inputs.extra_context = extra_context;
|
|
313
|
-
inputs.now = std::chrono::system_clock::now();
|
|
314
|
-
|
|
315
|
-
chat_template_options opts;
|
|
316
|
-
opts.apply_polyfills = apply_polyfills;
|
|
317
|
-
|
|
318
|
-
return apply(inputs, opts);
|
|
319
|
-
}
|
|
320
|
-
|
|
321
|
-
std::string apply(
|
|
322
|
-
const chat_template_inputs & inputs,
|
|
323
|
-
const chat_template_options & opts = chat_template_options()) const
|
|
324
|
-
{
|
|
325
|
-
json actual_messages;
|
|
326
|
-
|
|
327
|
-
auto has_tools = inputs.tools.is_array() && !inputs.tools.empty();
|
|
328
|
-
auto has_tool_calls = false;
|
|
329
|
-
auto has_tool_responses = false;
|
|
330
|
-
auto has_string_content = false;
|
|
331
|
-
for (const auto & message : inputs.messages) {
|
|
332
|
-
if (message.contains("tool_calls") && !message["tool_calls"].is_null()) {
|
|
333
|
-
has_tool_calls = true;
|
|
334
|
-
}
|
|
335
|
-
if (message.contains("role") && message["role"] == "tool") {
|
|
336
|
-
has_tool_responses = true;
|
|
337
|
-
}
|
|
338
|
-
if (message.contains("content") && message["content"].is_string()) {
|
|
339
|
-
has_string_content = true;
|
|
340
|
-
}
|
|
341
|
-
}
|
|
342
|
-
|
|
343
|
-
auto polyfill_system_role = opts.polyfill_system_role && !caps_.supports_system_role;
|
|
344
|
-
auto polyfill_tools = opts.polyfill_tools && has_tools && !caps_.supports_tools;
|
|
345
|
-
auto polyfill_tool_call_example = polyfill_tools && opts.polyfill_tool_call_examples;
|
|
346
|
-
auto polyfill_tool_calls = opts.polyfill_tool_calls && has_tool_calls && !caps_.supports_tool_calls;
|
|
347
|
-
auto polyfill_tool_responses = opts.polyfill_tool_responses && has_tool_responses && !caps_.supports_tool_responses;
|
|
348
|
-
auto polyfill_object_arguments = opts.polyfill_object_arguments && has_tool_calls && caps_.requires_object_arguments;
|
|
349
|
-
auto polyfill_typed_content = opts.polyfill_typed_content && has_string_content && caps_.requires_typed_content;
|
|
350
|
-
|
|
351
|
-
auto needs_polyfills = opts.apply_polyfills && (false
|
|
352
|
-
|| polyfill_system_role
|
|
353
|
-
|| polyfill_tools
|
|
354
|
-
|| polyfill_tool_calls
|
|
355
|
-
|| polyfill_tool_responses
|
|
356
|
-
|| polyfill_object_arguments
|
|
357
|
-
|| polyfill_typed_content
|
|
358
|
-
);
|
|
359
|
-
|
|
360
|
-
if (needs_polyfills) {
|
|
361
|
-
actual_messages = json::array();
|
|
362
|
-
|
|
363
|
-
auto add_message = [&](const json & msg) {
|
|
364
|
-
if (polyfill_typed_content && msg.contains("content") && !msg.at("content").is_null() && msg.at("content").is_string()) {
|
|
365
|
-
actual_messages.push_back({
|
|
366
|
-
{"role", msg.at("role")},
|
|
367
|
-
{"content", {{
|
|
368
|
-
{"type", "text"},
|
|
369
|
-
{"text", msg.at("content")},
|
|
370
|
-
}}},
|
|
371
|
-
});
|
|
372
|
-
} else {
|
|
373
|
-
actual_messages.push_back(msg);
|
|
374
|
-
}
|
|
375
|
-
};
|
|
376
|
-
|
|
377
|
-
std::string pending_system;
|
|
378
|
-
auto flush_sys = [&]() {
|
|
379
|
-
if (!pending_system.empty()) {
|
|
380
|
-
add_message({
|
|
381
|
-
{"role", "user"},
|
|
382
|
-
{"content", pending_system},
|
|
383
|
-
});
|
|
384
|
-
pending_system.clear();
|
|
385
|
-
}
|
|
386
|
-
};
|
|
387
|
-
|
|
388
|
-
json adjusted_messages;
|
|
389
|
-
if (polyfill_tools) {
|
|
390
|
-
adjusted_messages = add_system(inputs.messages,
|
|
391
|
-
"You can call any of the following tools to satisfy the user's requests: " + minja::Value(inputs.tools).dump(2, /* to_json= */ true) +
|
|
392
|
-
(!polyfill_tool_call_example || tool_call_example_.empty() ? "" : "\n\nExample tool call syntax:\n\n" + tool_call_example_ + "\n\n"));
|
|
393
|
-
} else {
|
|
394
|
-
adjusted_messages = inputs.messages;
|
|
395
|
-
}
|
|
396
|
-
|
|
397
|
-
for (const auto & message_ : adjusted_messages) {
|
|
398
|
-
auto message = message_;
|
|
399
|
-
if (!message.contains("role") || (!message.contains("content") && !message.contains("tool_calls"))) {
|
|
400
|
-
throw std::runtime_error("message must have 'role' and one of 'content' or 'tool_calls' fields: " + message.dump());
|
|
401
|
-
}
|
|
402
|
-
std::string role = message.at("role");
|
|
403
|
-
|
|
404
|
-
if (message.contains("tool_calls")) {
|
|
405
|
-
if (polyfill_object_arguments || polyfill_tool_calls) {
|
|
406
|
-
for (auto & tool_call : message.at("tool_calls")) {
|
|
407
|
-
if (tool_call["type"] == "function") {
|
|
408
|
-
auto & function = tool_call.at("function");
|
|
409
|
-
auto & arguments = function.at("arguments");
|
|
410
|
-
if (arguments.is_string()) {
|
|
411
|
-
try {
|
|
412
|
-
arguments = json::parse(arguments.get<std::string>());
|
|
413
|
-
} catch (const std::exception & ecvt) {
|
|
414
|
-
fprintf(stderr, "Failed to parse arguments: %s\n", ecvt.what());
|
|
415
|
-
}
|
|
416
|
-
}
|
|
417
|
-
}
|
|
418
|
-
}
|
|
419
|
-
}
|
|
420
|
-
if (polyfill_tool_calls) {
|
|
421
|
-
auto tool_calls = json::array();
|
|
422
|
-
for (const auto & tool_call : message.at("tool_calls")) {
|
|
423
|
-
if (tool_call.at("type") != "function") {
|
|
424
|
-
continue;
|
|
425
|
-
}
|
|
426
|
-
const auto & function = tool_call.at("function");
|
|
427
|
-
auto tc = json {
|
|
428
|
-
{"name", function.at("name")},
|
|
429
|
-
{"arguments", function.at("arguments")},
|
|
430
|
-
};
|
|
431
|
-
if (tool_call.contains("id")) {
|
|
432
|
-
tc["id"] = tool_call["id"];
|
|
433
|
-
}
|
|
434
|
-
tool_calls.push_back(tc);
|
|
435
|
-
}
|
|
436
|
-
auto obj = json {
|
|
437
|
-
{"tool_calls", tool_calls},
|
|
438
|
-
};
|
|
439
|
-
if (message.contains("content")) {
|
|
440
|
-
auto content = message.at("content");
|
|
441
|
-
if (!content.is_null() && !content.empty()) {
|
|
442
|
-
obj["content"] = content;
|
|
443
|
-
}
|
|
444
|
-
}
|
|
445
|
-
message["content"] = obj.dump(2);
|
|
446
|
-
message.erase("tool_calls");
|
|
447
|
-
}
|
|
448
|
-
}
|
|
449
|
-
if (polyfill_tool_responses && role == "tool") {
|
|
450
|
-
message["role"] = "user";
|
|
451
|
-
auto obj = json {
|
|
452
|
-
{"tool_response", json::object()},
|
|
453
|
-
};
|
|
454
|
-
if (message.contains("name")) {
|
|
455
|
-
obj["tool_response"]["tool"] = message.at("name");
|
|
456
|
-
}
|
|
457
|
-
obj["tool_response"]["content"] = message.at("content");
|
|
458
|
-
if (message.contains("tool_call_id")) {
|
|
459
|
-
obj["tool_response"]["tool_call_id"] = message.at("tool_call_id");
|
|
460
|
-
}
|
|
461
|
-
message["content"] = obj.dump(2);
|
|
462
|
-
message.erase("name");
|
|
463
|
-
}
|
|
464
|
-
|
|
465
|
-
if (!message["content"].is_null() && polyfill_system_role) {
|
|
466
|
-
std::string content = message.at("content");
|
|
467
|
-
if (role == "system") {
|
|
468
|
-
if (!pending_system.empty()) pending_system += "\n";
|
|
469
|
-
pending_system += content;
|
|
470
|
-
continue;
|
|
471
|
-
} else {
|
|
472
|
-
if (role == "user") {
|
|
473
|
-
if (!pending_system.empty()) {
|
|
474
|
-
message["content"] = pending_system + (content.empty() ? "" : "\n" + content);
|
|
475
|
-
pending_system.clear();
|
|
476
|
-
}
|
|
477
|
-
} else {
|
|
478
|
-
flush_sys();
|
|
479
|
-
}
|
|
480
|
-
}
|
|
481
|
-
}
|
|
482
|
-
add_message(message);
|
|
483
|
-
}
|
|
484
|
-
flush_sys();
|
|
485
|
-
} else {
|
|
486
|
-
actual_messages = inputs.messages;
|
|
487
|
-
}
|
|
488
|
-
|
|
489
|
-
auto context = minja::Context::make(json({
|
|
490
|
-
{"messages", actual_messages},
|
|
491
|
-
{"add_generation_prompt", inputs.add_generation_prompt},
|
|
492
|
-
}));
|
|
493
|
-
context->set("bos_token", opts.use_bos_token ? bos_token_ : "");
|
|
494
|
-
context->set("eos_token", opts.use_eos_token ? eos_token_ : "");
|
|
495
|
-
if (opts.define_strftime_now) {
|
|
496
|
-
auto now = inputs.now;
|
|
497
|
-
context->set("strftime_now", Value::callable([now](const std::shared_ptr<minja::Context> &, minja::ArgumentsValue & args) {
|
|
498
|
-
args.expectArgs("strftime_now", {1, 1}, {0, 0});
|
|
499
|
-
auto format = args.args[0].get<std::string>();
|
|
500
|
-
|
|
501
|
-
auto time = std::chrono::system_clock::to_time_t(now);
|
|
502
|
-
auto local_time = *std::localtime(&time);
|
|
503
|
-
std::ostringstream ss;
|
|
504
|
-
ss << std::put_time(&local_time, format.c_str());
|
|
505
|
-
return ss.str();
|
|
506
|
-
}));
|
|
507
|
-
}
|
|
508
|
-
if (!inputs.tools.is_null()) {
|
|
509
|
-
context->set("tools", minja::Value(inputs.tools));
|
|
510
|
-
}
|
|
511
|
-
if (!inputs.extra_context.is_null()) {
|
|
512
|
-
for (auto & kv : inputs.extra_context.items()) {
|
|
513
|
-
context->set(kv.key(), minja::Value(kv.value()));
|
|
514
|
-
}
|
|
515
|
-
}
|
|
516
|
-
|
|
517
|
-
auto ret = template_root_->render(context);
|
|
518
|
-
// fprintf(stderr, "actual_messages: %s\n", actual_messages.dump(2).c_str());
|
|
519
|
-
// fprintf(stderr, "apply: %s\n\n", ret.c_str());
|
|
520
|
-
return ret;
|
|
521
|
-
}
|
|
522
|
-
|
|
523
|
-
static nlohmann::ordered_json add_system(const nlohmann::ordered_json & messages, const std::string & system_prompt) {
|
|
524
|
-
json messages_with_system = messages;
|
|
525
|
-
|
|
526
|
-
if (!messages_with_system.empty() && messages_with_system[0].at("role") == "system") {
|
|
527
|
-
std::string existing_system = messages_with_system.at(0).at("content");
|
|
528
|
-
messages_with_system[0] = json {
|
|
529
|
-
{"role", "system"},
|
|
530
|
-
{"content", existing_system + "\n\n" + system_prompt},
|
|
531
|
-
};
|
|
532
|
-
} else {
|
|
533
|
-
messages_with_system.insert(messages_with_system.begin(), json {
|
|
534
|
-
{"role", "system"},
|
|
535
|
-
{"content", system_prompt},
|
|
536
|
-
});
|
|
537
|
-
}
|
|
538
|
-
return messages_with_system;
|
|
539
|
-
}
|
|
540
|
-
};
|
|
541
|
-
|
|
542
|
-
} // namespace minja
|