npm - react-native-litert-lm - Versions diffs - 0.1.1 → 0.2.1 - Mend

react-native-litert-lm 0.1.1 → 0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

package/README.md +149 -31
package/android/src/main/java/com/margelo/nitro/dev/litert/litertlm/HybridLiteRTLM.kt +307 -61
package/cpp/HybridLiteRTLM.cpp +85 -31
package/cpp/HybridLiteRTLM.hpp +4 -0
package/cpp/include/stb_image.h +7988 -0
package/lib/hooks.d.ts +16 -0
package/lib/hooks.js +114 -0
package/lib/index.d.ts +27 -2
package/lib/index.js +50 -6
package/lib/modelFactory.d.ts +5 -0
package/lib/modelFactory.js +42 -0
package/lib/specs/LiteRTLM.nitro.d.ts +19 -0
package/lib/templates.d.ts +51 -0
package/lib/templates.js +81 -0
package/nitrogen/generated/android/LiteRTLMOnLoad.cpp +2 -0
package/nitrogen/generated/android/c++/JFunc_void_double.hpp +75 -0
package/nitrogen/generated/android/c++/JHybridLiteRTLMSpec.cpp +33 -1
package/nitrogen/generated/android/c++/JHybridLiteRTLMSpec.hpp +2 -0
package/nitrogen/generated/android/c++/JLLMConfig.hpp +6 -1
package/nitrogen/generated/android/kotlin/com/margelo/nitro/dev/litert/litertlm/Func_void_double.kt +80 -0
package/nitrogen/generated/android/kotlin/com/margelo/nitro/dev/litert/litertlm/HybridLiteRTLMSpec.kt +13 -0
package/nitrogen/generated/android/kotlin/com/margelo/nitro/dev/litert/litertlm/LLMConfig.kt +5 -2
package/nitrogen/generated/shared/c++/HybridLiteRTLMSpec.cpp +2 -0
package/nitrogen/generated/shared/c++/HybridLiteRTLMSpec.hpp +2 -0
package/nitrogen/generated/shared/c++/LLMConfig.hpp +7 -2
package/package.json +1 -1
package/src/hooks.ts +152 -0
package/src/index.ts +41 -3
package/src/modelFactory.ts +49 -0
package/src/specs/LiteRTLM.nitro.ts +26 -0
package/src/templates.ts +105 -0

package/cpp/HybridLiteRTLM.cpp CHANGED Viewed

@@ -11,9 +11,13 @@
 #include "HybridLiteRTLM.hpp"
+#define STB_IMAGE_IMPLEMENTATION
+#include "include/stb_image.h"
 #include <chrono>
 #include <stdexcept>
 #include <sstream>
+#include <fstream>
 namespace margelo::nitro::litertlm {
@@ -229,32 +233,46 @@ std::string HybridLiteRTLM::sendMessageWithImage(
   ensureLoaded();
 #ifdef LITERT_LM_ENABLED
-  // TODO: Load image file into raw pixel buffer
-  // The Engine expects raw RGBA/RGB data, not a file path.
-  // Implementation should:
-  // 1. Read image file (using stb_image.h or Android Bitmap JNI)
-  // 2. Decode to raw pixel buffer (std::vector<uint8_t>)
-  // 3. Create litert::lm::ImageData or equivalent tensor
-  // 4. Pass to conversation_->SendMessage with multimodal content
-  // For now, fall back to text-only with a note about the image
-  std::string augmentedMessage = message + " [Image attached: " + imagePath +
-    " - Note: Image processing not yet implemented, text-only response]";
+  // Load image using stb_image
+  int width, height, channels;
+  unsigned char* img = stbi_load(imagePath.c_str(), &width, &height, &channels, 3); // Force 3 channels (RGB)
+  if (img == nullptr) {
+    throw std::runtime_error("Failed to load image from path: " + imagePath);
+  }
+  // Create input tensor/buffer for the engine.
+  // Note: The exact API for passing image data depends on the LiteRT-LM version.
+  // Assuming a structure that accepts raw bytes and dimensions.
   litert::lm::UserMessage lm_message;
   lm_message.role = "user";
-  lm_message.content = augmentedMessage;
+  // Construct multimodal content
+  // Option A: If UserMessage supports a list of content parts
+  litert::lm::ContentPart textPart;
+  textPart.type = litert::lm::ContentType::TEXT;
+  textPart.text = message;
+  lm_message.parts.push_back(textPart);
+  litert::lm::ContentPart imagePart;
+  imagePart.type = litert::lm::ContentType::IMAGE;
+  imagePart.image.width = width;
+  imagePart.image.height = height;
+  imagePart.image.channels = channels;
+  imagePart.image.data = std::vector<uint8_t>(img, img + (width * height * channels));
+  lm_message.parts.push_back(imagePart);
+  stbi_image_free(img);
   auto response = conversation_->SendMessage(lm_message);
   if (!response.ok()) {
     throw std::runtime_error("Multimodal inference failed: " +
         std::string(response.status().message()));
   }
-  // Add to history
+  // Add to history (metadata only)
   Message userMessage;
   userMessage.role = Role::USER;
-  userMessage.content = message + " [with image]";
+  userMessage.content = message + " [Image]";
   history_.push_back(userMessage);
   Message modelMessage;
@@ -265,11 +283,34 @@ std::string HybridLiteRTLM::sendMessageWithImage(
   return response->content;
 #else
-  // Stub: just process text with image path noted
-  return sendMessage(message + " [Image: " + imagePath + "]");
+  // iOS: LiteRT-LM SDK not yet available, throw clear error
+  throw std::runtime_error(
+      "sendMessageWithImage is not supported on iOS. "
+      "LiteRT-LM iOS SDK is not yet available. "
+      "Please use text-only sendMessage() for now.");
+#endif
+}
 #endif
 }
+//------------------------------------------------------------------------------
+// downloadModel - Stub: performs no download; the returned future always fails
+//------------------------------------------------------------------------------
+std::future<std::string> HybridLiteRTLM::downloadModel(
+    const std::string& url,
+    const std::string& fileName,
+    const std::optional<std::function<void(double)>>& onProgress) {
+  // url, fileName and onProgress are unused (the lambda captures nothing); the error is thrown inside the async task, so it reaches the caller through the future rather than from this call.
+  return std::async(std::launch::async, []() -> std::string {
+    throw std::runtime_error(
+        "downloadModel is not supported on iOS yet. "
+        "Please download the model manually using a separate library."
+    );
+  });
+}
 //------------------------------------------------------------------------------
 // sendMessageWithAudio - Multimodal audio + text
 //------------------------------------------------------------------------------
@@ -281,31 +322,41 @@ std::string HybridLiteRTLM::sendMessageWithAudio(
   ensureLoaded();
 #ifdef LITERT_LM_ENABLED
-  // TODO: Load audio file into raw sample buffer
-  // Similar to image - Engine expects raw audio samples, not file path.
-  // Implementation should:
-  // 1. Read WAV file header and samples
-  // 2. Convert to expected format (likely 16kHz mono float32)
-  // 3. Create litert::lm::AudioData or equivalent
-  // 4. Pass to conversation with multimodal content
+  // Load audio file
+  std::ifstream audioFile(audioPath, std::ios::binary);
+  if (!audioFile) {
+      throw std::runtime_error("Failed to open audio file: " + audioPath);
+  }
-  std::string augmentedMessage = message + " [Audio attached: " + audioPath +
-    " - Note: Audio processing not yet implemented, text-only response]";
+  // Read the entire file as raw bytes. No WAV header is parsed or skipped here,
+  // so any header bytes are handed to the engine together with the samples.
+  // Ideally use a WAV parsing library or miniaudio if available.
+  std::vector<uint8_t> audioData((std::istreambuf_iterator<char>(audioFile)), std::istreambuf_iterator<char>());
   litert::lm::UserMessage lm_message;
   lm_message.role = "user";
-  lm_message.content = augmentedMessage;
+  litert::lm::ContentPart textPart;
+  textPart.type = litert::lm::ContentType::TEXT;
+  textPart.text = message;
+  lm_message.parts.push_back(textPart);
+  litert::lm::ContentPart audioPart;
+  audioPart.type = litert::lm::ContentType::AUDIO;
+  audioPart.audio.data = audioData;
+  // Metadata like sample rate might be needed:
+  // audioPart.audio.sample_rate = 16000;
+  lm_message.parts.push_back(audioPart);
   auto response = conversation_->SendMessage(lm_message);
   if (!response.ok()) {
     throw std::runtime_error("Audio inference failed: " +
         std::string(response.status().message()));
   }
-  // Add to history
   Message userMessage;
   userMessage.role = Role::USER;
-  userMessage.content = message + " [with audio]";
+  userMessage.content = message + " [Audio]";
   history_.push_back(userMessage);
   Message modelMessage;
@@ -316,8 +367,11 @@ std::string HybridLiteRTLM::sendMessageWithAudio(
   return response->content;
 #else
-  // Stub: just process text with audio path noted
-  return sendMessage(message + " [Audio: " + audioPath + "]");
+  // iOS: LiteRT-LM SDK not yet available, throw clear error
+  throw std::runtime_error(
+      "sendMessageWithAudio is not supported on iOS. "
+      "LiteRT-LM iOS SDK is not yet available. "
+      "Please use text-only sendMessage() for now.");
 #endif
 }

package/cpp/HybridLiteRTLM.hpp CHANGED Viewed

@@ -58,6 +58,10 @@ public:
   std::string sendMessageWithImage(const std::string& message,
                                    const std::string& imagePath) override;
+  std::future<std::string> downloadModel(const std::string& url,
+                                         const std::string& fileName,
+                                         const std::optional<std::function<void(double)>>& onProgress) override;
   std::string sendMessageWithAudio(const std::string& message,
                                    const std::string& audioPath) override;