cactus-react-native 1.2.0 → 1.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +573 -13
- package/android/CMakeLists.txt +4 -3
- package/android/src/main/java/com/margelo/nitro/cactus/HybridCactusFileSystem.kt +21 -4
- package/android/src/main/jniLibs/arm64-v8a/libcactus.a +0 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_util.a +0 -0
- package/cpp/HybridCactus.cpp +112 -19
- package/cpp/HybridCactus.hpp +12 -3
- package/cpp/HybridCactusIndex.cpp +325 -0
- package/cpp/HybridCactusIndex.hpp +43 -0
- package/cpp/HybridCactusUtil.cpp +3 -3
- package/cpp/HybridCactusUtil.hpp +2 -1
- package/cpp/cactus_ffi.h +83 -2
- package/cpp/cactus_util.h +1 -1
- package/ios/HybridCactusFileSystem.swift +23 -2
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus.h +2 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus_ffi.h +83 -2
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/cactus_telemetry.h +656 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/{ffi_utils.h → cactus_utils.h} +104 -17
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/engine.h +117 -7
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/graph.h +91 -5
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Headers/kernel.h +15 -6
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/ios-arm64/cactus.framework/cactus +0 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus.h +2 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus_ffi.h +83 -2
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/cactus_telemetry.h +656 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/{ffi_utils.h → cactus_utils.h} +104 -17
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/engine.h +117 -7
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/graph.h +91 -5
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Headers/kernel.h +15 -6
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/Info.plist +0 -0
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/_CodeSignature/CodeResources +1 -1
- package/ios/cactus.xcframework/ios-arm64-simulator/cactus.framework/cactus +0 -0
- package/ios/cactus_util.xcframework/Info.plist +4 -4
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/cactus_util.h +1 -1
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Headers/database.h +27 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/Info.plist +0 -0
- package/ios/cactus_util.xcframework/ios-arm64/cactus_util.framework/cactus_util +0 -0
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/cactus_util.h +1 -1
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Headers/database.h +27 -0
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/Info.plist +0 -0
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/_CodeSignature/CodeResources +3 -3
- package/ios/cactus_util.xcframework/ios-arm64-simulator/cactus_util.framework/cactus_util +0 -0
- package/lib/module/api/Database.js +57 -3
- package/lib/module/api/Database.js.map +1 -1
- package/lib/module/classes/CactusIndex.js +45 -0
- package/lib/module/classes/CactusIndex.js.map +1 -0
- package/lib/module/classes/CactusLM.js +35 -10
- package/lib/module/classes/CactusLM.js.map +1 -1
- package/lib/module/classes/CactusSTT.js +20 -12
- package/lib/module/classes/CactusSTT.js.map +1 -1
- package/lib/module/config/CactusConfig.js +2 -0
- package/lib/module/config/CactusConfig.js.map +1 -1
- package/lib/module/constants/packageVersion.js +1 -1
- package/lib/module/hooks/useCactusIndex.js +175 -0
- package/lib/module/hooks/useCactusIndex.js.map +1 -0
- package/lib/module/hooks/useCactusLM.js +54 -2
- package/lib/module/hooks/useCactusLM.js.map +1 -1
- package/lib/module/hooks/useCactusSTT.js +2 -2
- package/lib/module/hooks/useCactusSTT.js.map +1 -1
- package/lib/module/index.js +2 -0
- package/lib/module/index.js.map +1 -1
- package/lib/module/native/Cactus.js +21 -5
- package/lib/module/native/Cactus.js.map +1 -1
- package/lib/module/native/CactusFileSystem.js +3 -0
- package/lib/module/native/CactusFileSystem.js.map +1 -1
- package/lib/module/native/CactusIndex.js +32 -0
- package/lib/module/native/CactusIndex.js.map +1 -0
- package/lib/module/native/CactusUtil.js +16 -3
- package/lib/module/native/CactusUtil.js.map +1 -1
- package/lib/module/native/index.js +1 -0
- package/lib/module/native/index.js.map +1 -1
- package/lib/module/specs/CactusIndex.nitro.js +4 -0
- package/lib/module/specs/CactusIndex.nitro.js.map +1 -0
- package/lib/module/telemetry/Telemetry.js +3 -1
- package/lib/module/telemetry/Telemetry.js.map +1 -1
- package/lib/module/types/CactusIndex.js +2 -0
- package/lib/module/types/CactusIndex.js.map +1 -0
- package/lib/module/types/CactusSTTModel.js +2 -0
- package/lib/module/types/CactusSTTModel.js.map +1 -0
- package/lib/typescript/src/api/Database.d.ts +7 -1
- package/lib/typescript/src/api/Database.d.ts.map +1 -1
- package/lib/typescript/src/classes/CactusIndex.d.ts +15 -0
- package/lib/typescript/src/classes/CactusIndex.d.ts.map +1 -0
- package/lib/typescript/src/classes/CactusLM.d.ts +5 -3
- package/lib/typescript/src/classes/CactusLM.d.ts.map +1 -1
- package/lib/typescript/src/classes/CactusSTT.d.ts +4 -4
- package/lib/typescript/src/classes/CactusSTT.d.ts.map +1 -1
- package/lib/typescript/src/config/CactusConfig.d.ts +1 -0
- package/lib/typescript/src/config/CactusConfig.d.ts.map +1 -1
- package/lib/typescript/src/constants/packageVersion.d.ts +1 -1
- package/lib/typescript/src/hooks/useCactusIndex.d.ts +14 -0
- package/lib/typescript/src/hooks/useCactusIndex.d.ts.map +1 -0
- package/lib/typescript/src/hooks/useCactusLM.d.ts +4 -2
- package/lib/typescript/src/hooks/useCactusLM.d.ts.map +1 -1
- package/lib/typescript/src/hooks/useCactusSTT.d.ts +3 -3
- package/lib/typescript/src/hooks/useCactusSTT.d.ts.map +1 -1
- package/lib/typescript/src/index.d.ts +5 -1
- package/lib/typescript/src/index.d.ts.map +1 -1
- package/lib/typescript/src/native/Cactus.d.ts +4 -2
- package/lib/typescript/src/native/Cactus.d.ts.map +1 -1
- package/lib/typescript/src/native/CactusFileSystem.d.ts +1 -0
- package/lib/typescript/src/native/CactusFileSystem.d.ts.map +1 -1
- package/lib/typescript/src/native/CactusIndex.d.ts +12 -0
- package/lib/typescript/src/native/CactusIndex.d.ts.map +1 -0
- package/lib/typescript/src/native/CactusUtil.d.ts.map +1 -1
- package/lib/typescript/src/native/index.d.ts +1 -0
- package/lib/typescript/src/native/index.d.ts.map +1 -1
- package/lib/typescript/src/specs/Cactus.nitro.d.ts +4 -2
- package/lib/typescript/src/specs/Cactus.nitro.d.ts.map +1 -1
- package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts +1 -0
- package/lib/typescript/src/specs/CactusFileSystem.nitro.d.ts.map +1 -1
- package/lib/typescript/src/specs/CactusIndex.nitro.d.ts +24 -0
- package/lib/typescript/src/specs/CactusIndex.nitro.d.ts.map +1 -0
- package/lib/typescript/src/specs/CactusUtil.nitro.d.ts +1 -1
- package/lib/typescript/src/specs/CactusUtil.nitro.d.ts.map +1 -1
- package/lib/typescript/src/types/CactusIndex.d.ts +34 -0
- package/lib/typescript/src/types/CactusIndex.d.ts.map +1 -0
- package/lib/typescript/src/types/CactusLM.d.ts +17 -0
- package/lib/typescript/src/types/CactusLM.d.ts.map +1 -1
- package/lib/typescript/src/types/CactusModel.d.ts +1 -0
- package/lib/typescript/src/types/CactusModel.d.ts.map +1 -1
- package/lib/typescript/src/types/CactusSTT.d.ts +1 -1
- package/lib/typescript/src/types/CactusSTT.d.ts.map +1 -1
- package/lib/typescript/src/types/CactusSTTModel.d.ts +8 -0
- package/lib/typescript/src/types/CactusSTTModel.d.ts.map +1 -0
- package/nitro.json +3 -0
- package/nitrogen/generated/android/c++/JDeviceInfo.hpp +1 -1
- package/nitrogen/generated/android/c++/JFunc_void_double.hpp +1 -1
- package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.cpp +1 -1
- package/nitrogen/generated/android/c++/JHybridCactusCryptoSpec.hpp +1 -1
- package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.cpp +1 -1
- package/nitrogen/generated/android/c++/JHybridCactusDeviceInfoSpec.hpp +1 -1
- package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.cpp +17 -1
- package/nitrogen/generated/android/c++/JHybridCactusFileSystemSpec.hpp +2 -1
- package/nitrogen/generated/android/c++/JHybridCactusImageSpec.cpp +1 -1
- package/nitrogen/generated/android/c++/JHybridCactusImageSpec.hpp +1 -1
- package/nitrogen/generated/android/cactus+autolinking.cmake +2 -1
- package/nitrogen/generated/android/cactus+autolinking.gradle +1 -1
- package/nitrogen/generated/android/cactusOnLoad.cpp +11 -1
- package/nitrogen/generated/android/cactusOnLoad.hpp +1 -1
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/DeviceInfo.kt +1 -1
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/Func_void_double.kt +1 -1
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusCryptoSpec.kt +1 -1
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusDeviceInfoSpec.kt +1 -1
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusFileSystemSpec.kt +5 -1
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/HybridCactusImageSpec.kt +1 -1
- package/nitrogen/generated/android/kotlin/com/margelo/nitro/cactus/cactusOnLoad.kt +1 -1
- package/nitrogen/generated/ios/Cactus+autolinking.rb +1 -1
- package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.cpp +1 -1
- package/nitrogen/generated/ios/Cactus-Swift-Cxx-Bridge.hpp +1 -1
- package/nitrogen/generated/ios/Cactus-Swift-Cxx-Umbrella.hpp +1 -1
- package/nitrogen/generated/ios/CactusAutolinking.mm +11 -1
- package/nitrogen/generated/ios/CactusAutolinking.swift +1 -1
- package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.cpp +1 -1
- package/nitrogen/generated/ios/c++/HybridCactusCryptoSpecSwift.hpp +1 -1
- package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.cpp +1 -1
- package/nitrogen/generated/ios/c++/HybridCactusDeviceInfoSpecSwift.hpp +1 -1
- package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.cpp +1 -1
- package/nitrogen/generated/ios/c++/HybridCactusFileSystemSpecSwift.hpp +9 -1
- package/nitrogen/generated/ios/c++/HybridCactusImageSpecSwift.cpp +1 -1
- package/nitrogen/generated/ios/c++/HybridCactusImageSpecSwift.hpp +1 -1
- package/nitrogen/generated/ios/swift/DeviceInfo.swift +1 -1
- package/nitrogen/generated/ios/swift/Func_void.swift +1 -1
- package/nitrogen/generated/ios/swift/Func_void_DeviceInfo.swift +1 -1
- package/nitrogen/generated/ios/swift/Func_void_bool.swift +1 -1
- package/nitrogen/generated/ios/swift/Func_void_double.swift +1 -1
- package/nitrogen/generated/ios/swift/Func_void_std__exception_ptr.swift +1 -1
- package/nitrogen/generated/ios/swift/Func_void_std__optional_std__string_.swift +1 -1
- package/nitrogen/generated/ios/swift/Func_void_std__string.swift +1 -1
- package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec.swift +1 -1
- package/nitrogen/generated/ios/swift/HybridCactusCryptoSpec_cxx.swift +1 -1
- package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec.swift +1 -1
- package/nitrogen/generated/ios/swift/HybridCactusDeviceInfoSpec_cxx.swift +1 -1
- package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec.swift +2 -1
- package/nitrogen/generated/ios/swift/HybridCactusFileSystemSpec_cxx.swift +20 -1
- package/nitrogen/generated/ios/swift/HybridCactusImageSpec.swift +1 -1
- package/nitrogen/generated/ios/swift/HybridCactusImageSpec_cxx.swift +1 -1
- package/nitrogen/generated/shared/c++/CactusIndexGetResult.hpp +84 -0
- package/nitrogen/generated/shared/c++/CactusIndexQueryResult.hpp +79 -0
- package/nitrogen/generated/shared/c++/DeviceInfo.hpp +1 -1
- package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.cpp +1 -1
- package/nitrogen/generated/shared/c++/HybridCactusCryptoSpec.hpp +1 -1
- package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.cpp +1 -1
- package/nitrogen/generated/shared/c++/HybridCactusDeviceInfoSpec.hpp +1 -1
- package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.cpp +2 -1
- package/nitrogen/generated/shared/c++/HybridCactusFileSystemSpec.hpp +2 -1
- package/nitrogen/generated/shared/c++/HybridCactusImageSpec.cpp +1 -1
- package/nitrogen/generated/shared/c++/HybridCactusImageSpec.hpp +1 -1
- package/nitrogen/generated/shared/c++/HybridCactusIndexSpec.cpp +27 -0
- package/nitrogen/generated/shared/c++/HybridCactusIndexSpec.hpp +76 -0
- package/nitrogen/generated/shared/c++/HybridCactusSpec.cpp +3 -1
- package/nitrogen/generated/shared/c++/HybridCactusSpec.hpp +6 -3
- package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.cpp +1 -1
- package/nitrogen/generated/shared/c++/HybridCactusUtilSpec.hpp +2 -2
- package/package.json +2 -2
- package/src/api/Database.ts +80 -2
- package/src/classes/CactusIndex.ts +58 -0
- package/src/classes/CactusLM.ts +41 -11
- package/src/classes/CactusSTT.ts +24 -16
- package/src/config/CactusConfig.ts +3 -0
- package/src/constants/packageVersion.ts +1 -1
- package/src/hooks/useCactusIndex.ts +195 -0
- package/src/hooks/useCactusLM.ts +63 -3
- package/src/hooks/useCactusSTT.ts +4 -4
- package/src/index.tsx +17 -0
- package/src/native/Cactus.ts +39 -4
- package/src/native/CactusFileSystem.ts +4 -0
- package/src/native/CactusIndex.ts +54 -0
- package/src/native/CactusUtil.ts +19 -3
- package/src/native/index.ts +1 -0
- package/src/specs/Cactus.nitro.ts +13 -2
- package/src/specs/CactusFileSystem.nitro.ts +2 -0
- package/src/specs/CactusIndex.nitro.ts +31 -0
- package/src/specs/CactusUtil.nitro.ts +1 -1
- package/src/telemetry/Telemetry.ts +1 -1
- package/src/types/CactusIndex.ts +40 -0
- package/src/types/CactusLM.ts +21 -0
- package/src/types/CactusModel.ts +1 -0
- package/src/types/CactusSTT.ts +1 -1
- package/src/types/CactusSTTModel.ts +10 -0
- package/android/src/main/jniLibs/arm64-v8a/libcactus_util.so +0 -0
package/android/CMakeLists.txt
CHANGED
|
@@ -6,10 +6,11 @@ set(CMAKE_VERBOSE_MAKEFILE ON)
|
|
|
6
6
|
set(CMAKE_CXX_STANDARD 20)
|
|
7
7
|
|
|
8
8
|
# Define C++ library and add all sources
|
|
9
|
-
add_library(${PACKAGE_NAME} SHARED
|
|
9
|
+
add_library(${PACKAGE_NAME} SHARED
|
|
10
10
|
src/main/cpp/cpp-adapter.cpp
|
|
11
11
|
../cpp/HybridCactus.cpp
|
|
12
12
|
../cpp/HybridCactusUtil.cpp
|
|
13
|
+
../cpp/HybridCactusIndex.cpp
|
|
13
14
|
)
|
|
14
15
|
|
|
15
16
|
add_library(libcactus STATIC IMPORTED)
|
|
@@ -17,9 +18,9 @@ set_target_properties(libcactus PROPERTIES
|
|
|
17
18
|
IMPORTED_LOCATION "${CMAKE_CURRENT_LIST_DIR}/src/main/jniLibs/${ANDROID_ABI}/libcactus.a"
|
|
18
19
|
)
|
|
19
20
|
|
|
20
|
-
add_library(libcactus_util
|
|
21
|
+
add_library(libcactus_util STATIC IMPORTED)
|
|
21
22
|
set_target_properties(libcactus_util PROPERTIES
|
|
22
|
-
IMPORTED_LOCATION "${CMAKE_CURRENT_LIST_DIR}/src/main/jniLibs/${ANDROID_ABI}/libcactus_util.
|
|
23
|
+
IMPORTED_LOCATION "${CMAKE_CURRENT_LIST_DIR}/src/main/jniLibs/${ANDROID_ABI}/libcactus_util.a"
|
|
23
24
|
)
|
|
24
25
|
|
|
25
26
|
# Add Nitrogen specs :)
|
|
@@ -209,10 +209,10 @@ class HybridCactusFileSystem : HybridCactusFileSystemSpec() {
|
|
|
209
209
|
modelFile.deleteRecursively()
|
|
210
210
|
}
|
|
211
211
|
|
|
212
|
+
override fun getIndexPath(name: String): Promise<String> = Promise.async { indexFile(name).absolutePath }
|
|
213
|
+
|
|
212
214
|
private fun cactusFile(): File {
|
|
213
|
-
val
|
|
214
|
-
context.getExternalFilesDir(android.os.Environment.DIRECTORY_DOCUMENTS) ?: context.filesDir
|
|
215
|
-
val cactusDir = File(documentsDir, "cactus")
|
|
215
|
+
val cactusDir = File(context.filesDir, "cactus")
|
|
216
216
|
|
|
217
217
|
if (!cactusDir.exists()) {
|
|
218
218
|
cactusDir.mkdirs()
|
|
@@ -223,6 +223,23 @@ class HybridCactusFileSystem : HybridCactusFileSystemSpec() {
|
|
|
223
223
|
|
|
224
224
|
private fun modelFile(model: String): File {
|
|
225
225
|
val cactusDir = cactusFile()
|
|
226
|
-
|
|
226
|
+
val modelsDir = File(cactusDir, "models")
|
|
227
|
+
|
|
228
|
+
if (!modelsDir.exists()) {
|
|
229
|
+
modelsDir.mkdirs()
|
|
230
|
+
}
|
|
231
|
+
|
|
232
|
+
return File(modelsDir, model)
|
|
233
|
+
}
|
|
234
|
+
|
|
235
|
+
private fun indexFile(name: String): File {
|
|
236
|
+
val cactusDir = cactusFile()
|
|
237
|
+
val finalDir = File(cactusDir, "indexes/$name")
|
|
238
|
+
|
|
239
|
+
if (!finalDir.exists()) {
|
|
240
|
+
finalDir.mkdirs()
|
|
241
|
+
}
|
|
242
|
+
|
|
243
|
+
return finalDir
|
|
227
244
|
}
|
|
228
245
|
}
|
|
Binary file
|
|
Binary file
|
package/cpp/HybridCactus.cpp
CHANGED
|
@@ -1,6 +1,7 @@
|
|
|
1
1
|
#include "HybridCactus.hpp"
|
|
2
2
|
|
|
3
3
|
namespace margelo::nitro::cactus {
|
|
4
|
+
|
|
4
5
|
HybridCactus::HybridCactus() : HybridObject(TAG) {}
|
|
5
6
|
|
|
6
7
|
std::shared_ptr<Promise<void>>
|
|
@@ -19,7 +20,8 @@ HybridCactus::init(const std::string &modelPath, double contextSize,
|
|
|
19
20
|
corpusDir ? corpusDir->c_str() : nullptr);
|
|
20
21
|
|
|
21
22
|
if (!model) {
|
|
22
|
-
throw std::runtime_error("
|
|
23
|
+
throw std::runtime_error("Cactus init failed: " +
|
|
24
|
+
std::string(cactus_get_last_error()));
|
|
23
25
|
}
|
|
24
26
|
|
|
25
27
|
this->_model = model;
|
|
@@ -65,7 +67,8 @@ std::shared_ptr<Promise<std::string>> HybridCactus::complete(
|
|
|
65
67
|
cactusTokenCallback, &callbackCtx);
|
|
66
68
|
|
|
67
69
|
if (result < 0) {
|
|
68
|
-
throw std::runtime_error("Cactus
|
|
70
|
+
throw std::runtime_error("Cactus complete failed: " +
|
|
71
|
+
std::string(cactus_get_last_error()));
|
|
69
72
|
}
|
|
70
73
|
|
|
71
74
|
// Remove null terminator
|
|
@@ -75,12 +78,78 @@ std::shared_ptr<Promise<std::string>> HybridCactus::complete(
|
|
|
75
78
|
});
|
|
76
79
|
}
|
|
77
80
|
|
|
81
|
+
std::shared_ptr<Promise<std::vector<double>>>
|
|
82
|
+
HybridCactus::tokenize(const std::string &text) {
|
|
83
|
+
return Promise<std::vector<double>>::async([this,
|
|
84
|
+
text]() -> std::vector<double> {
|
|
85
|
+
std::lock_guard<std::mutex> lock(this->_modelMutex);
|
|
86
|
+
|
|
87
|
+
if (!this->_model) {
|
|
88
|
+
throw std::runtime_error("Cactus model is not initialized");
|
|
89
|
+
}
|
|
90
|
+
|
|
91
|
+
std::vector<uint32_t> tokenBuffer(text.length() * 2 + 16);
|
|
92
|
+
size_t outTokenLen = 0;
|
|
93
|
+
|
|
94
|
+
int result = cactus_tokenize(this->_model, text.c_str(), tokenBuffer.data(),
|
|
95
|
+
tokenBuffer.size(), &outTokenLen);
|
|
96
|
+
|
|
97
|
+
if (result < 0) {
|
|
98
|
+
throw std::runtime_error("Cactus tokenize failed: " +
|
|
99
|
+
std::string(cactus_get_last_error()));
|
|
100
|
+
}
|
|
101
|
+
|
|
102
|
+
tokenBuffer.resize(outTokenLen);
|
|
103
|
+
|
|
104
|
+
return std::vector<double>(tokenBuffer.begin(), tokenBuffer.end());
|
|
105
|
+
});
|
|
106
|
+
}
|
|
107
|
+
|
|
108
|
+
std::shared_ptr<Promise<std::string>>
|
|
109
|
+
HybridCactus::scoreWindow(const std::vector<double> &tokens, double start,
|
|
110
|
+
double end, double context) {
|
|
111
|
+
return Promise<std::string>::async(
|
|
112
|
+
[this, tokens, start, end, context]() -> std::string {
|
|
113
|
+
std::lock_guard<std::mutex> lock(this->_modelMutex);
|
|
114
|
+
|
|
115
|
+
if (!this->_model) {
|
|
116
|
+
throw std::runtime_error("Cactus model is not initialized");
|
|
117
|
+
}
|
|
118
|
+
|
|
119
|
+
std::vector<uint32_t> tokenBuffer;
|
|
120
|
+
tokenBuffer.reserve(tokens.size());
|
|
121
|
+
for (double d : tokens) {
|
|
122
|
+
tokenBuffer.emplace_back(static_cast<uint32_t>(d));
|
|
123
|
+
}
|
|
124
|
+
|
|
125
|
+
std::string responseBuffer;
|
|
126
|
+
responseBuffer.resize(1024);
|
|
127
|
+
|
|
128
|
+
int result = cactus_score_window(
|
|
129
|
+
this->_model, tokenBuffer.data(), tokenBuffer.size(),
|
|
130
|
+
static_cast<size_t>(start), static_cast<size_t>(end),
|
|
131
|
+
static_cast<size_t>(context), responseBuffer.data(),
|
|
132
|
+
responseBuffer.size());
|
|
133
|
+
|
|
134
|
+
if (result < 0) {
|
|
135
|
+
throw std::runtime_error("Cactus score window failed: " +
|
|
136
|
+
std::string(cactus_get_last_error()));
|
|
137
|
+
}
|
|
138
|
+
|
|
139
|
+
// Remove null terminator
|
|
140
|
+
responseBuffer.resize(strlen(responseBuffer.c_str()));
|
|
141
|
+
|
|
142
|
+
return responseBuffer;
|
|
143
|
+
});
|
|
144
|
+
}
|
|
145
|
+
|
|
78
146
|
std::shared_ptr<Promise<std::string>> HybridCactus::transcribe(
|
|
79
|
-
const std::
|
|
80
|
-
|
|
147
|
+
const std::variant<std::vector<double>, std::string> &audio,
|
|
148
|
+
const std::string &prompt, double responseBufferSize,
|
|
149
|
+
const std::optional<std::string> &optionsJson,
|
|
81
150
|
const std::optional<std::function<void(const std::string & /* token */,
|
|
82
151
|
double /* tokenId */)>> &callback) {
|
|
83
|
-
return Promise<std::string>::async([this,
|
|
152
|
+
return Promise<std::string>::async([this, audio, prompt, optionsJson,
|
|
84
153
|
callback,
|
|
85
154
|
responseBufferSize]() -> std::string {
|
|
86
155
|
std::lock_guard<std::mutex> lock(this->_modelMutex);
|
|
@@ -105,14 +174,34 @@ std::shared_ptr<Promise<std::string>> HybridCactus::transcribe(
|
|
|
105
174
|
std::string responseBuffer;
|
|
106
175
|
responseBuffer.resize(responseBufferSize);
|
|
107
176
|
|
|
108
|
-
int result
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
|
|
112
|
-
|
|
177
|
+
int result;
|
|
178
|
+
if (std::holds_alternative<std::string>(audio)) {
|
|
179
|
+
result = cactus_transcribe(
|
|
180
|
+
this->_model, std::get<std::string>(audio).c_str(), prompt.c_str(),
|
|
181
|
+
responseBuffer.data(), responseBufferSize,
|
|
182
|
+
optionsJson ? optionsJson->c_str() : nullptr, cactusTokenCallback,
|
|
183
|
+
&callbackCtx, nullptr, 0);
|
|
184
|
+
} else {
|
|
185
|
+
const auto &audioDoubles = std::get<std::vector<double>>(audio);
|
|
186
|
+
|
|
187
|
+
std::vector<uint8_t> audioBytes;
|
|
188
|
+
audioBytes.reserve(audioDoubles.size());
|
|
189
|
+
|
|
190
|
+
for (double d : audioDoubles) {
|
|
191
|
+
d = std::clamp(d, 0.0, 255.0);
|
|
192
|
+
audioBytes.emplace_back(static_cast<uint8_t>(d));
|
|
193
|
+
}
|
|
194
|
+
|
|
195
|
+
result = cactus_transcribe(this->_model, nullptr, prompt.c_str(),
|
|
196
|
+
responseBuffer.data(), responseBufferSize,
|
|
197
|
+
optionsJson ? optionsJson->c_str() : nullptr,
|
|
198
|
+
cactusTokenCallback, &callbackCtx,
|
|
199
|
+
audioBytes.data(), audioBytes.size());
|
|
200
|
+
}
|
|
113
201
|
|
|
114
202
|
if (result < 0) {
|
|
115
|
-
throw std::runtime_error("Cactus
|
|
203
|
+
throw std::runtime_error("Cactus transcribe failed: " +
|
|
204
|
+
std::string(cactus_get_last_error()));
|
|
116
205
|
}
|
|
117
206
|
|
|
118
207
|
// Remove null terminator
|
|
@@ -123,9 +212,10 @@ std::shared_ptr<Promise<std::string>> HybridCactus::transcribe(
|
|
|
123
212
|
}
|
|
124
213
|
|
|
125
214
|
std::shared_ptr<Promise<std::vector<double>>>
|
|
126
|
-
HybridCactus::embed(const std::string &text, double embeddingBufferSize
|
|
215
|
+
HybridCactus::embed(const std::string &text, double embeddingBufferSize,
|
|
216
|
+
bool normalize) {
|
|
127
217
|
return Promise<std::vector<double>>::async(
|
|
128
|
-
[this, text, embeddingBufferSize]() -> std::vector<double> {
|
|
218
|
+
[this, text, embeddingBufferSize, normalize]() -> std::vector<double> {
|
|
129
219
|
std::lock_guard<std::mutex> lock(this->_modelMutex);
|
|
130
220
|
|
|
131
221
|
if (!this->_model) {
|
|
@@ -135,12 +225,13 @@ HybridCactus::embed(const std::string &text, double embeddingBufferSize) {
|
|
|
135
225
|
std::vector<float> embeddingBuffer(embeddingBufferSize);
|
|
136
226
|
size_t embeddingDim;
|
|
137
227
|
|
|
138
|
-
int result =
|
|
139
|
-
|
|
140
|
-
|
|
228
|
+
int result = cactus_embed(
|
|
229
|
+
this->_model, text.c_str(), embeddingBuffer.data(),
|
|
230
|
+
embeddingBufferSize * sizeof(float), &embeddingDim, normalize);
|
|
141
231
|
|
|
142
232
|
if (result < 0) {
|
|
143
|
-
throw std::runtime_error("Cactus
|
|
233
|
+
throw std::runtime_error("Cactus embed failed: " +
|
|
234
|
+
std::string(cactus_get_last_error()));
|
|
144
235
|
}
|
|
145
236
|
|
|
146
237
|
embeddingBuffer.resize(embeddingDim);
|
|
@@ -169,7 +260,8 @@ HybridCactus::imageEmbed(const std::string &imagePath,
|
|
|
169
260
|
embeddingBufferSize * sizeof(float), &embeddingDim);
|
|
170
261
|
|
|
171
262
|
if (result < 0) {
|
|
172
|
-
throw std::runtime_error("Cactus image
|
|
263
|
+
throw std::runtime_error("Cactus image embed failed: " +
|
|
264
|
+
std::string(cactus_get_last_error()));
|
|
173
265
|
}
|
|
174
266
|
|
|
175
267
|
embeddingBuffer.resize(embeddingDim);
|
|
@@ -198,7 +290,8 @@ HybridCactus::audioEmbed(const std::string &audioPath,
|
|
|
198
290
|
embeddingBufferSize * sizeof(float), &embeddingDim);
|
|
199
291
|
|
|
200
292
|
if (result < 0) {
|
|
201
|
-
throw std::runtime_error("Cactus audio
|
|
293
|
+
throw std::runtime_error("Cactus audio embed failed: " +
|
|
294
|
+
std::string(cactus_get_last_error()));
|
|
202
295
|
}
|
|
203
296
|
|
|
204
297
|
embeddingBuffer.resize(embeddingDim);
|
package/cpp/HybridCactus.hpp
CHANGED
|
@@ -23,15 +23,24 @@ public:
|
|
|
23
23
|
double /* tokenId */)>> &callback)
|
|
24
24
|
override;
|
|
25
25
|
|
|
26
|
+
std::shared_ptr<Promise<std::vector<double>>>
|
|
27
|
+
tokenize(const std::string &text) override;
|
|
28
|
+
|
|
29
|
+
std::shared_ptr<Promise<std::string>>
|
|
30
|
+
scoreWindow(const std::vector<double> &tokens, double start, double end,
|
|
31
|
+
double context) override;
|
|
32
|
+
|
|
26
33
|
std::shared_ptr<Promise<std::string>> transcribe(
|
|
27
|
-
const std::
|
|
28
|
-
|
|
34
|
+
const std::variant<std::vector<double>, std::string> &audio,
|
|
35
|
+
const std::string &prompt, double responseBufferSize,
|
|
36
|
+
const std::optional<std::string> &optionsJson,
|
|
29
37
|
const std::optional<std::function<void(const std::string & /* token */,
|
|
30
38
|
double /* tokenId */)>> &callback)
|
|
31
39
|
override;
|
|
32
40
|
|
|
33
41
|
std::shared_ptr<Promise<std::vector<double>>>
|
|
34
|
-
embed(const std::string &text, double embeddingBufferSize
|
|
42
|
+
embed(const std::string &text, double embeddingBufferSize,
|
|
43
|
+
bool normalize) override;
|
|
35
44
|
|
|
36
45
|
std::shared_ptr<Promise<std::vector<double>>>
|
|
37
46
|
imageEmbed(const std::string &imagePath, double embeddingBufferSize) override;
|
|
@@ -0,0 +1,325 @@
|
|
|
1
|
+
#include "HybridCactusIndex.hpp"
|
|
2
|
+
|
|
3
|
+
namespace margelo::nitro::cactus {
|
|
4
|
+
|
|
5
|
+
HybridCactusIndex::HybridCactusIndex() : HybridObject(TAG) {}
|
|
6
|
+
|
|
7
|
+
std::shared_ptr<Promise<void>>
|
|
8
|
+
HybridCactusIndex::init(const std::string &indexPath, double embeddingDim) {
|
|
9
|
+
return Promise<void>::async([this, indexPath, embeddingDim]() -> void {
|
|
10
|
+
std::lock_guard<std::mutex> lock(this->_indexMutex);
|
|
11
|
+
|
|
12
|
+
if (this->_index) {
|
|
13
|
+
throw std::runtime_error("Cactus index is already initialized");
|
|
14
|
+
}
|
|
15
|
+
|
|
16
|
+
const cactus_index_t index =
|
|
17
|
+
cactus_index_init(indexPath.c_str(), embeddingDim);
|
|
18
|
+
|
|
19
|
+
if (!index) {
|
|
20
|
+
throw std::runtime_error("Cactus index init failed: " +
|
|
21
|
+
std::string(cactus_get_last_error()));
|
|
22
|
+
}
|
|
23
|
+
|
|
24
|
+
this->_index = index;
|
|
25
|
+
this->_embeddingDim = static_cast<size_t>(embeddingDim);
|
|
26
|
+
});
|
|
27
|
+
}
|
|
28
|
+
|
|
29
|
+
std::shared_ptr<Promise<void>> HybridCactusIndex::add(
|
|
30
|
+
const std::vector<double> &ids, const std::vector<std::string> &documents,
|
|
31
|
+
const std::vector<std::vector<double>> &embeddings,
|
|
32
|
+
const std::optional<std::vector<std::string>> &metadatas) {
|
|
33
|
+
return Promise<void>::async([this, ids, documents, embeddings,
|
|
34
|
+
metadatas]() -> void {
|
|
35
|
+
std::lock_guard<std::mutex> lock(this->_indexMutex);
|
|
36
|
+
|
|
37
|
+
if (!this->_index) {
|
|
38
|
+
throw std::runtime_error("Cactus index is not initialized");
|
|
39
|
+
}
|
|
40
|
+
|
|
41
|
+
const size_t count = ids.size();
|
|
42
|
+
if (documents.size() != count || embeddings.size() != count) {
|
|
43
|
+
throw std::runtime_error(
|
|
44
|
+
"ids, documents, and embeddings must have the same length");
|
|
45
|
+
}
|
|
46
|
+
|
|
47
|
+
if (metadatas.has_value() && metadatas->size() != count) {
|
|
48
|
+
throw std::runtime_error(
|
|
49
|
+
"metadatas must have the same length as other vectors");
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
std::vector<int> intIds;
|
|
53
|
+
intIds.reserve(count);
|
|
54
|
+
for (size_t i = 0; i < count; ++i) {
|
|
55
|
+
intIds.emplace_back(static_cast<int>(ids[i]));
|
|
56
|
+
}
|
|
57
|
+
|
|
58
|
+
std::vector<const char *> documentPtrs;
|
|
59
|
+
documentPtrs.reserve(count);
|
|
60
|
+
for (size_t i = 0; i < count; ++i) {
|
|
61
|
+
documentPtrs.emplace_back(documents[i].c_str());
|
|
62
|
+
}
|
|
63
|
+
|
|
64
|
+
std::vector<std::vector<float>> embeddingsFloat(count);
|
|
65
|
+
std::vector<const float *> embeddingPtrs;
|
|
66
|
+
embeddingPtrs.reserve(count);
|
|
67
|
+
for (size_t i = 0; i < count; ++i) {
|
|
68
|
+
embeddingsFloat[i].resize(embeddings[i].size());
|
|
69
|
+
for (size_t j = 0; j < embeddings[i].size(); ++j) {
|
|
70
|
+
embeddingsFloat[i][j] = static_cast<float>(embeddings[i][j]);
|
|
71
|
+
}
|
|
72
|
+
embeddingPtrs.emplace_back(embeddingsFloat[i].data());
|
|
73
|
+
}
|
|
74
|
+
|
|
75
|
+
int result;
|
|
76
|
+
if (metadatas.has_value()) {
|
|
77
|
+
std::vector<const char *> metadataPtrs;
|
|
78
|
+
metadataPtrs.reserve(count);
|
|
79
|
+
for (size_t i = 0; i < count; ++i) {
|
|
80
|
+
metadataPtrs.emplace_back((*metadatas)[i].c_str());
|
|
81
|
+
}
|
|
82
|
+
result = cactus_index_add(
|
|
83
|
+
this->_index, intIds.data(), documentPtrs.data(), metadataPtrs.data(),
|
|
84
|
+
embeddingPtrs.data(), count, this->_embeddingDim);
|
|
85
|
+
} else {
|
|
86
|
+
result = cactus_index_add(
|
|
87
|
+
this->_index, intIds.data(), documentPtrs.data(), nullptr,
|
|
88
|
+
embeddingPtrs.data(), count, this->_embeddingDim);
|
|
89
|
+
}
|
|
90
|
+
|
|
91
|
+
if (result < 0) {
|
|
92
|
+
throw std::runtime_error("Cactus index add failed: " +
|
|
93
|
+
std::string(cactus_get_last_error()));
|
|
94
|
+
}
|
|
95
|
+
});
|
|
96
|
+
}
|
|
97
|
+
|
|
98
|
+
std::shared_ptr<Promise<void>>
|
|
99
|
+
HybridCactusIndex::_delete(const std::vector<double> &ids) {
|
|
100
|
+
return Promise<void>::async([this, ids]() -> void {
|
|
101
|
+
std::lock_guard<std::mutex> lock(this->_indexMutex);
|
|
102
|
+
|
|
103
|
+
if (!this->_index) {
|
|
104
|
+
throw std::runtime_error("Cactus index is not initialized");
|
|
105
|
+
}
|
|
106
|
+
|
|
107
|
+
std::vector<int> intIds;
|
|
108
|
+
intIds.reserve(ids.size());
|
|
109
|
+
for (size_t i = 0; i < ids.size(); ++i) {
|
|
110
|
+
intIds.emplace_back(static_cast<int>(ids[i]));
|
|
111
|
+
}
|
|
112
|
+
|
|
113
|
+
int result = cactus_index_delete(this->_index, intIds.data(), ids.size());
|
|
114
|
+
|
|
115
|
+
if (result < 0) {
|
|
116
|
+
throw std::runtime_error("Cactus index delete failed: " +
|
|
117
|
+
std::string(cactus_get_last_error()));
|
|
118
|
+
}
|
|
119
|
+
});
|
|
120
|
+
}
|
|
121
|
+
|
|
122
|
+
std::shared_ptr<Promise<CactusIndexGetResult>>
|
|
123
|
+
HybridCactusIndex::get(const std::vector<double> &ids) {
|
|
124
|
+
return Promise<CactusIndexGetResult>::async([this,
|
|
125
|
+
ids]() -> CactusIndexGetResult {
|
|
126
|
+
std::lock_guard<std::mutex> lock(this->_indexMutex);
|
|
127
|
+
|
|
128
|
+
if (!this->_index) {
|
|
129
|
+
throw std::runtime_error("Cactus index is not initialized");
|
|
130
|
+
}
|
|
131
|
+
|
|
132
|
+
const size_t count = ids.size();
|
|
133
|
+
|
|
134
|
+
std::vector<int> intIds;
|
|
135
|
+
intIds.reserve(count);
|
|
136
|
+
for (size_t i = 0; i < count; ++i) {
|
|
137
|
+
intIds.emplace_back(static_cast<int>(ids[i]));
|
|
138
|
+
}
|
|
139
|
+
|
|
140
|
+
std::vector<std::unique_ptr<char[]>> documentBuffers;
|
|
141
|
+
documentBuffers.reserve(count);
|
|
142
|
+
std::vector<std::unique_ptr<char[]>> metadataBuffers;
|
|
143
|
+
metadataBuffers.reserve(count);
|
|
144
|
+
std::vector<std::unique_ptr<float[]>> embeddingBuffers;
|
|
145
|
+
embeddingBuffers.reserve(count);
|
|
146
|
+
|
|
147
|
+
const size_t maxStringSize = 65535;
|
|
148
|
+
std::vector<size_t> documentBufferSizes(count, maxStringSize);
|
|
149
|
+
std::vector<size_t> metadataBufferSizes(count, maxStringSize);
|
|
150
|
+
std::vector<size_t> embeddingBufferSizes(count, this->_embeddingDim);
|
|
151
|
+
|
|
152
|
+
std::vector<char *> documentPtrs;
|
|
153
|
+
documentPtrs.reserve(count);
|
|
154
|
+
std::vector<char *> metadataPtrs;
|
|
155
|
+
metadataPtrs.reserve(count);
|
|
156
|
+
std::vector<float *> embeddingPtrs;
|
|
157
|
+
embeddingPtrs.reserve(count);
|
|
158
|
+
|
|
159
|
+
for (size_t i = 0; i < count; ++i) {
|
|
160
|
+
documentBuffers.emplace_back(std::make_unique<char[]>(maxStringSize));
|
|
161
|
+
documentPtrs.emplace_back(documentBuffers[i].get());
|
|
162
|
+
|
|
163
|
+
metadataBuffers.emplace_back(std::make_unique<char[]>(maxStringSize));
|
|
164
|
+
metadataPtrs.emplace_back(metadataBuffers[i].get());
|
|
165
|
+
|
|
166
|
+
embeddingBuffers.emplace_back(
|
|
167
|
+
std::make_unique<float[]>(this->_embeddingDim));
|
|
168
|
+
embeddingPtrs.emplace_back(embeddingBuffers[i].get());
|
|
169
|
+
}
|
|
170
|
+
|
|
171
|
+
int result =
|
|
172
|
+
cactus_index_get(this->_index, intIds.data(), count,
|
|
173
|
+
documentPtrs.data(), documentBufferSizes.data(),
|
|
174
|
+
metadataPtrs.data(), metadataBufferSizes.data(),
|
|
175
|
+
embeddingPtrs.data(), embeddingBufferSizes.data());
|
|
176
|
+
|
|
177
|
+
if (result < 0) {
|
|
178
|
+
throw std::runtime_error("Cactus index get failed: " +
|
|
179
|
+
std::string(cactus_get_last_error()));
|
|
180
|
+
}
|
|
181
|
+
|
|
182
|
+
CactusIndexGetResult resultObj;
|
|
183
|
+
resultObj.documents.reserve(count);
|
|
184
|
+
resultObj.metadatas.reserve(count);
|
|
185
|
+
resultObj.embeddings = std::vector<std::vector<double>>(count);
|
|
186
|
+
|
|
187
|
+
for (size_t i = 0; i < count; ++i) {
|
|
188
|
+
resultObj.documents.emplace_back(std::string(documentBuffers[i].get()));
|
|
189
|
+
resultObj.metadatas.emplace_back(std::string(metadataBuffers[i].get()));
|
|
190
|
+
|
|
191
|
+
resultObj.embeddings[i].reserve(this->_embeddingDim);
|
|
192
|
+
for (size_t j = 0; j < this->_embeddingDim; ++j) {
|
|
193
|
+
resultObj.embeddings[i].emplace_back(
|
|
194
|
+
static_cast<double>(embeddingBuffers[i].get()[j]));
|
|
195
|
+
}
|
|
196
|
+
}
|
|
197
|
+
|
|
198
|
+
return resultObj;
|
|
199
|
+
});
|
|
200
|
+
}
|
|
201
|
+
|
|
202
|
+
std::shared_ptr<Promise<CactusIndexQueryResult>>
|
|
203
|
+
HybridCactusIndex::query(const std::vector<std::vector<double>> &embeddings,
|
|
204
|
+
const std::optional<std::string> &optionsJson) {
|
|
205
|
+
return Promise<CactusIndexQueryResult>::async(
|
|
206
|
+
[this, embeddings, optionsJson]() -> CactusIndexQueryResult {
|
|
207
|
+
std::lock_guard<std::mutex> lock(this->_indexMutex);
|
|
208
|
+
|
|
209
|
+
if (!this->_index) {
|
|
210
|
+
throw std::runtime_error("Cactus index is not initialized");
|
|
211
|
+
}
|
|
212
|
+
|
|
213
|
+
const size_t count = embeddings.size();
|
|
214
|
+
|
|
215
|
+
std::vector<std::vector<float>> embeddingsFloat(count);
|
|
216
|
+
std::vector<const float *> embeddingPtrs;
|
|
217
|
+
embeddingPtrs.reserve(count);
|
|
218
|
+
for (size_t i = 0; i < count; ++i) {
|
|
219
|
+
embeddingsFloat[i].resize(embeddings[i].size());
|
|
220
|
+
for (size_t j = 0; j < embeddings[i].size(); ++j) {
|
|
221
|
+
embeddingsFloat[i][j] = static_cast<float>(embeddings[i][j]);
|
|
222
|
+
}
|
|
223
|
+
embeddingPtrs.emplace_back(embeddingsFloat[i].data());
|
|
224
|
+
}
|
|
225
|
+
|
|
226
|
+
size_t maxResults = 10;
|
|
227
|
+
if (optionsJson.has_value()) {
|
|
228
|
+
const std::string &json = *optionsJson;
|
|
229
|
+
size_t pos = json.find("\"top_k\"");
|
|
230
|
+
if (pos != std::string::npos) {
|
|
231
|
+
size_t colonPos = json.find(':', pos);
|
|
232
|
+
if (colonPos != std::string::npos) {
|
|
233
|
+
size_t numStart = json.find_first_of("0123456789", colonPos);
|
|
234
|
+
if (numStart != std::string::npos) {
|
|
235
|
+
size_t numEnd = json.find_first_not_of("0123456789", numStart);
|
|
236
|
+
std::string numStr = json.substr(numStart, numEnd - numStart);
|
|
237
|
+
maxResults = std::stoul(numStr);
|
|
238
|
+
}
|
|
239
|
+
}
|
|
240
|
+
}
|
|
241
|
+
}
|
|
242
|
+
|
|
243
|
+
std::vector<size_t> idBufferSizes(count, maxResults);
|
|
244
|
+
std::vector<size_t> scoreBufferSizes(count, maxResults);
|
|
245
|
+
|
|
246
|
+
std::vector<std::unique_ptr<int[]>> idBuffers;
|
|
247
|
+
idBuffers.reserve(count);
|
|
248
|
+
std::vector<std::unique_ptr<float[]>> scoreBuffers;
|
|
249
|
+
scoreBuffers.reserve(count);
|
|
250
|
+
|
|
251
|
+
std::vector<int *> idPtrs;
|
|
252
|
+
idPtrs.reserve(count);
|
|
253
|
+
std::vector<float *> scorePtrs;
|
|
254
|
+
scorePtrs.reserve(count);
|
|
255
|
+
|
|
256
|
+
for (size_t i = 0; i < count; ++i) {
|
|
257
|
+
idBuffers.emplace_back(std::make_unique<int[]>(maxResults));
|
|
258
|
+
idPtrs.emplace_back(idBuffers[i].get());
|
|
259
|
+
|
|
260
|
+
scoreBuffers.emplace_back(std::make_unique<float[]>(maxResults));
|
|
261
|
+
scorePtrs.emplace_back(scoreBuffers[i].get());
|
|
262
|
+
}
|
|
263
|
+
|
|
264
|
+
int result = cactus_index_query(
|
|
265
|
+
this->_index, embeddingPtrs.data(), count, this->_embeddingDim,
|
|
266
|
+
optionsJson ? optionsJson->c_str() : nullptr, idPtrs.data(),
|
|
267
|
+
idBufferSizes.data(), scorePtrs.data(), scoreBufferSizes.data());
|
|
268
|
+
|
|
269
|
+
if (result < 0) {
|
|
270
|
+
throw std::runtime_error("Cactus index query failed: " +
|
|
271
|
+
std::string(cactus_get_last_error()));
|
|
272
|
+
}
|
|
273
|
+
|
|
274
|
+
CactusIndexQueryResult resultObj;
|
|
275
|
+
resultObj.ids = std::vector<std::vector<double>>(count);
|
|
276
|
+
resultObj.scores = std::vector<std::vector<double>>(count);
|
|
277
|
+
|
|
278
|
+
for (size_t i = 0; i < count; ++i) {
|
|
279
|
+
const size_t resultCount = idBufferSizes[i];
|
|
280
|
+
resultObj.ids[i].reserve(resultCount);
|
|
281
|
+
resultObj.scores[i].reserve(resultCount);
|
|
282
|
+
|
|
283
|
+
for (size_t j = 0; j < resultCount; ++j) {
|
|
284
|
+
resultObj.ids[i].emplace_back(
|
|
285
|
+
static_cast<double>(idBuffers[i].get()[j]));
|
|
286
|
+
resultObj.scores[i].emplace_back(
|
|
287
|
+
static_cast<double>(scoreBuffers[i].get()[j]));
|
|
288
|
+
}
|
|
289
|
+
}
|
|
290
|
+
|
|
291
|
+
return resultObj;
|
|
292
|
+
});
|
|
293
|
+
}
|
|
294
|
+
|
|
295
|
+
std::shared_ptr<Promise<void>> HybridCactusIndex::compact() {
|
|
296
|
+
return Promise<void>::async([this]() -> void {
|
|
297
|
+
std::lock_guard<std::mutex> lock(this->_indexMutex);
|
|
298
|
+
|
|
299
|
+
if (!this->_index) {
|
|
300
|
+
throw std::runtime_error("Cactus index is not initialized");
|
|
301
|
+
}
|
|
302
|
+
|
|
303
|
+
int result = cactus_index_compact(this->_index);
|
|
304
|
+
|
|
305
|
+
if (result < 0) {
|
|
306
|
+
throw std::runtime_error("Cactus index compact failed: " +
|
|
307
|
+
std::string(cactus_get_last_error()));
|
|
308
|
+
}
|
|
309
|
+
});
|
|
310
|
+
}
|
|
311
|
+
|
|
312
|
+
std::shared_ptr<Promise<void>> HybridCactusIndex::destroy() {
|
|
313
|
+
return Promise<void>::async([this]() -> void {
|
|
314
|
+
std::lock_guard<std::mutex> lock(this->_indexMutex);
|
|
315
|
+
|
|
316
|
+
if (!this->_index) {
|
|
317
|
+
throw std::runtime_error("Cactus index is not initialized");
|
|
318
|
+
}
|
|
319
|
+
|
|
320
|
+
cactus_index_destroy(this->_index);
|
|
321
|
+
this->_index = nullptr;
|
|
322
|
+
});
|
|
323
|
+
}
|
|
324
|
+
|
|
325
|
+
} // namespace margelo::nitro::cactus
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
#pragma once
|
|
2
|
+
#include "HybridCactusIndexSpec.hpp"
|
|
3
|
+
|
|
4
|
+
#include "cactus_ffi.h"
|
|
5
|
+
|
|
6
|
+
#include <mutex>
|
|
7
|
+
|
|
8
|
+
namespace margelo::nitro::cactus {
|
|
9
|
+
|
|
10
|
+
class HybridCactusIndex : public HybridCactusIndexSpec {
|
|
11
|
+
public:
|
|
12
|
+
HybridCactusIndex();
|
|
13
|
+
|
|
14
|
+
std::shared_ptr<Promise<void>> init(const std::string &indexPath,
|
|
15
|
+
double embeddingDim) override;
|
|
16
|
+
|
|
17
|
+
std::shared_ptr<Promise<void>>
|
|
18
|
+
add(const std::vector<double> &ids, const std::vector<std::string> &documents,
|
|
19
|
+
const std::vector<std::vector<double>> &embeddings,
|
|
20
|
+
const std::optional<std::vector<std::string>> &metadatas) override;
|
|
21
|
+
|
|
22
|
+
std::shared_ptr<Promise<void>>
|
|
23
|
+
_delete(const std::vector<double> &ids) override;
|
|
24
|
+
|
|
25
|
+
std::shared_ptr<Promise<CactusIndexGetResult>>
|
|
26
|
+
get(const std::vector<double> &ids) override;
|
|
27
|
+
|
|
28
|
+
std::shared_ptr<Promise<CactusIndexQueryResult>>
|
|
29
|
+
query(const std::vector<std::vector<double>> &embeddings,
|
|
30
|
+
const std::optional<std::string> &optionsJson) override;
|
|
31
|
+
|
|
32
|
+
std::shared_ptr<Promise<void>> compact() override;
|
|
33
|
+
|
|
34
|
+
std::shared_ptr<Promise<void>> destroy() override;
|
|
35
|
+
|
|
36
|
+
private:
|
|
37
|
+
cactus_index_t _index = nullptr;
|
|
38
|
+
size_t _embeddingDim;
|
|
39
|
+
|
|
40
|
+
std::mutex _indexMutex;
|
|
41
|
+
};
|
|
42
|
+
|
|
43
|
+
} // namespace margelo::nitro::cactus
|
package/cpp/HybridCactusUtil.cpp
CHANGED
|
@@ -23,12 +23,12 @@ HybridCactusUtil::registerApp(const std::string &encryptedData) {
|
|
|
23
23
|
}
|
|
24
24
|
|
|
25
25
|
std::shared_ptr<Promise<std::optional<std::string>>>
|
|
26
|
-
HybridCactusUtil::getDeviceId() {
|
|
26
|
+
HybridCactusUtil::getDeviceId(const std::optional<std::string> &token) {
|
|
27
27
|
return Promise<std::optional<std::string>>::async(
|
|
28
|
-
[this]() -> std::optional<std::string> {
|
|
28
|
+
[this, token]() -> std::optional<std::string> {
|
|
29
29
|
std::lock_guard<std::mutex> lock(this->_mutex);
|
|
30
30
|
|
|
31
|
-
const char *deviceId = get_device_id();
|
|
31
|
+
const char *deviceId = get_device_id(token ? token->c_str() : nullptr);
|
|
32
32
|
return deviceId ? std::optional<std::string>(deviceId) : std::nullopt;
|
|
33
33
|
});
|
|
34
34
|
}
|