npm - react-native-litert-lm - Versions diffs - 0.3.4 → 0.3.6 - Mend

react-native-litert-lm 0.3.4 → 0.3.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9)

package/README.md +15 -15
package/android/CMakeLists.txt +1 -1
package/android/src/main/java/com/margelo/nitro/dev/litert/litertlm/HybridLiteRTLM.kt +41 -16
package/cpp/HybridLiteRTLM.cpp +3 -18
package/cpp/include/litert_lm_engine.h +9 -2
package/package.json +4 -4
package/scripts/build-ios-engine.sh +1 -1
package/scripts/postinstall.js +12 -5
package/ios/LiteRTLMAutolinking.mm +0 -30

package/README.md CHANGED Viewed

@@ -309,11 +309,11 @@ const buffer = tracker.getNativeBuffer();
 Download `.litertlm` models automatically using the exported URL constants, or manually from [HuggingFace](https://huggingface.co/litert-community):
-| Constant               | Model                              | Size     | Min RAM | Auth Required |
-| :--------------------- | :--------------------------------- | :------- | :------ | :------------ |
-| `GEMMA_4_E2B_IT`       | Gemma 4 E2B (Multimodal, IT)       | 2.58 GB  | 4 GB+   | ❌ No          |
-| `GEMMA_4_E4B_IT`       | Gemma 4 E4B (Higher Quality)       | 3.65 GB  | 6 GB+   | ❌ No          |
-| `GEMMA_3N_E2B_IT_INT4` | Gemma 3n E2B (Int4, Multimodal)    | ~1.3 GB  | 4 GB+   | ✅ HuggingFace |
+| Constant               | Model                           | Size    | Min RAM | Auth Required  |
+| :--------------------- | :------------------------------ | :------ | :------ | :------------- |
+| `GEMMA_4_E2B_IT`       | Gemma 4 E2B (Multimodal, IT)    | 2.58 GB | 4 GB+   | ❌ No          |
+| `GEMMA_4_E4B_IT`       | Gemma 4 E4B (Higher Quality)    | 3.65 GB | 6 GB+   | ❌ No          |
+| `GEMMA_3N_E2B_IT_INT4` | Gemma 3n E2B (Int4, Multimodal) | ~1.3 GB | 4 GB+   | ✅ HuggingFace |
 > **Recommended:** Use `GEMMA_4_E2B_IT` for most use cases. It's multimodal (text + vision + audio) and downloads directly from HuggingFace without requiring an account.
 >
@@ -452,7 +452,7 @@ const prompt = applyGemmaTemplate(
 | react-native-nitro-modules | 0.35.0+       |
 | Android API                | 26+ (ARM64)   |
 | iOS                        | 15.0+ (ARM64) |
-| LiteRT-LM Engine            | 0.10.1          |
+| LiteRT-LM Engine           | 0.10.2        |
 ## Platform Support
@@ -491,7 +491,7 @@ Add to your app's `.entitlements` file:
 ## Building the iOS Engine
-The iOS build uses a **Bazel-to-XCFramework pipeline** that compiles the LiteRT-LM C engine and all transitive dependencies into a static library (~83 MB).
+The iOS build uses a **Bazel-to-XCFramework pipeline** that compiles the LiteRT-LM C engine and all transitive dependencies into a static library (~82–84 MB).
 ### Prerequisites
@@ -506,12 +506,12 @@ The iOS build uses a **Bazel-to-XCFramework pipeline** that compiles the LiteRT-
 This will:
-1. Clone/checkout LiteRT-LM `v0.10.1` source into `.litert-lm-build/`
-2. Build `//c:engine` for `ios_arm64` and `ios_sim_arm64` via Bazel
-3. Collect all transitive `.o` files (engine, protobuf, re2, sentencepiece, etc.)
-4. Compile C/C++ stubs for unavailable Rust dependencies
-5. Patch `PromptTemplate` to use a simplified template engine (no Rust MinijinjaTemplate)
-6. Merge ~1,900 object files into a static library via `libtool`
+1. Clone/checkout LiteRT-LM `v0.10.2` source into `.litert-lm-build/`
+2. Apply `scripts/patches/ios-engine-fixes.patch` (PromptTemplate simplification, linker fixes)
+3. Build `//c:engine` for `ios_arm64` and `ios_sim_arm64` via Bazel
+4. Collect all transitive `.o` files (engine, protobuf, re2, sentencepiece, etc.)
+5. Compile C/C++ stubs for unavailable Rust dependencies
+6. Merge ~1,909 object files into a static library via `libtool`
 7. Package into `ios/Frameworks/LiteRTLM.xcframework`
 ### Output
@@ -520,10 +520,10 @@ This will:
 ios/Frameworks/LiteRTLM.xcframework/
 ├── Info.plist
 ├── ios-arm64/LiteRTLM.framework/              # Device
-│   ├── LiteRTLM                                # ~81 MB static library
+│   ├── LiteRTLM                                # ~82 MB static library
 │   └── Headers/litert_lm_engine.h
 └── ios-arm64-simulator/LiteRTLM.framework/    # Simulator
-    ├── LiteRTLM                                # ~83 MB static library
+    ├── LiteRTLM                                # ~84 MB static library
     └── Headers/litert_lm_engine.h
 ```

package/android/CMakeLists.txt CHANGED Viewed

@@ -19,7 +19,7 @@ add_library(
 # loads the NitroModules shared library. This is required because we're
 # building a library that depends on NitroModules symbols which are only
 # available at runtime.
-set(CMAKE_SHARED_LINKER_FLAGS "${CMAKE_SHARED_LINKER_FLAGS} -Wl,--allow-shlib-undefined")
+set(CMAKE_SHARED_LINKER_FLAGS "${CMAKE_SHARED_LINKER_FLAGS} -Wl,--allow-shlib-undefined,-z,max-page-size=16384")
 # Include Nitrogen autolinking - this adds all generated sources and links
 include(${CMAKE_SOURCE_DIR}/../nitrogen/generated/android/LiteRTLM+autolinking.cmake)

package/android/src/main/java/com/margelo/nitro/dev/litert/litertlm/HybridLiteRTLM.kt CHANGED Viewed

@@ -171,27 +171,40 @@ class HybridLiteRTLM : HybridLiteRTLMSpec() {
                         else -> com.google.ai.edge.litertlm.Backend.CPU()
                     }
-                    // Vision backend: hardcoded to GPU (required by Gemma models)
-                    val lmVisionBackend = com.google.ai.edge.litertlm.Backend.GPU()
-                    // Audio backend: hardcoded to CPU (optimal for audio processing)
-                    val lmAudioBackend = com.google.ai.edge.litertlm.Backend.CPU()
+                    // Detect multimodal support from model filename.
+                    // Only Gemma 3n bundles vision/audio executors; Gemma 4 E2B is text-only.
+                    // Passing vision/audio backends to a text-only model causes
+                    // vision_litert_compiled_model_executor init failures.
+                    val modelFileName = modelPath.substringAfterLast("/").lowercase()
+                    val isMultimodal = modelFileName.contains("3n") || modelFileName.contains("gemma3")
-                    Log.i(TAG, "Backend config: main=$lmBackend, vision=$lmVisionBackend (hardcoded), audio=$lmAudioBackend (hardcoded)")
+                    val lmVisionBackend = if (isMultimodal) com.google.ai.edge.litertlm.Backend.GPU() else null
+                    val lmAudioBackend = if (isMultimodal) com.google.ai.edge.litertlm.Backend.CPU() else null
+                    Log.i(TAG, "Backend config: main=$lmBackend, vision=$lmVisionBackend, audio=$lmAudioBackend, multimodal=$isMultimodal")
                     // Get cache directory from application context
                     val cacheDirectory = LiteRTLMInitProvider.applicationContext?.cacheDir?.absolutePath
                     Log.i(TAG, "Using cache directory: $cacheDirectory")
-                    // Create Engine configuration
-                    val engineConfig = EngineConfig(
-                        modelPath = modelPath,
-                        backend = lmBackend,
-                        visionBackend = lmVisionBackend,
-                        audioBackend = lmAudioBackend,
-                        maxNumTokens = maxTokens,
-                        cacheDir = cacheDirectory
-                    )
+                    // Create Engine configuration — visionBackend/audioBackend are optional
+                    val engineConfig = if (isMultimodal) {
+                        EngineConfig(
+                            modelPath = modelPath,
+                            backend = lmBackend,
+                            visionBackend = lmVisionBackend!!,
+                            audioBackend = lmAudioBackend!!,
+                            maxNumTokens = maxTokens,
+                            cacheDir = cacheDirectory
+                        )
+                    } else {
+                        EngineConfig(
+                            modelPath = modelPath,
+                            backend = lmBackend,
+                            maxNumTokens = maxTokens,
+                            cacheDir = cacheDirectory
+                        )
+                    }
                     if (isClosed) return@synchronized
@@ -615,7 +628,19 @@ class HybridLiteRTLM : HybridLiteRTLMSpec() {
     private fun createNewConversation() {
         ensureLoaded()
-        // Dispose old conversation if needed
+        // v0.10.2 enforces single-session: close existing conversation first
+        conversation?.let { oldConv ->
+            try {
+                if (oldConv is AutoCloseable) {
+                    oldConv.close()
+                } else {
+                    oldConv.javaClass.getMethod("close").invoke(oldConv)
+                }
+            } catch (e: Exception) {
+                Log.w(TAG, "Failed to close old conversation: ${e.message}")
+            }
+            conversation = null
+        }
         conversation = engine!!.createConversation()
         // Apply system prompt/instruction if set
         systemPrompt?.let { prompt ->

package/cpp/HybridLiteRTLM.cpp CHANGED Viewed

@@ -366,12 +366,7 @@ void HybridLiteRTLM::loadModelInternal(
     } else {
       diag += ", Readable: NO (errno: " + std::to_string(errno) + ")";
     }
-    // Get the native error from the C API
-    const char* nativeErr = litert_lm_get_last_error();
-    if (nativeErr && nativeErr[0] != '\0') {
-      diag += " | Native error: " + std::string(nativeErr);
-    }
     throw std::runtime_error(
       "Failed to create LiteRT-LM engine. Tried backend '" +
@@ -602,12 +597,7 @@ std::string HybridLiteRTLM::sendMessageWithImageInternal(
     conversation_, msgJson.c_str(), nullptr);
   if (!response) {
-    std::string errMsg = "LiteRT-LM: sendMessageWithImage failed";
-    const char* nativeErr = litert_lm_get_last_error();
-    if (nativeErr && nativeErr[0] != '\0') {
-      errMsg += ": " + std::string(nativeErr);
-    }
-    throw std::runtime_error(errMsg);
+    throw std::runtime_error("LiteRT-LM: sendMessageWithImage failed");
   }
   const char* responseStr = litert_lm_json_response_get_string(response);
@@ -667,12 +657,7 @@ std::string HybridLiteRTLM::sendMessageWithAudioInternal(
     conversation_, msgJson.c_str(), nullptr);
   if (!response) {
-    std::string errMsg = "LiteRT-LM: sendMessageWithAudio failed";
-    const char* nativeErr = litert_lm_get_last_error();
-    if (nativeErr && nativeErr[0] != '\0') {
-      errMsg += ": " + std::string(nativeErr);
-    }
-    throw std::runtime_error(errMsg);
+    throw std::runtime_error("LiteRT-LM: sendMessageWithAudio failed");
   }
   const char* responseStr = litert_lm_json_response_get_string(response);

package/cpp/include/litert_lm_engine.h CHANGED Viewed

@@ -182,6 +182,15 @@ LITERT_LM_C_API_EXPORT
 void litert_lm_engine_settings_set_max_num_tokens(
     LiteRtLmEngineSettings* settings, int max_num_tokens);
+// Sets whether the engine should load different sections of the litertlm file
+// in parallel. Defaults to true.
+//
+// @param settings The engine settings.
+// @param parallel_file_section_loading Whether to load in parallel.
+LITERT_LM_C_API_EXPORT
+void litert_lm_engine_settings_set_parallel_file_section_loading(
+    LiteRtLmEngineSettings* settings, bool parallel_file_section_loading);
 // Sets the cache directory for the engine.
 //
 // @param settings The engine settings.
@@ -236,14 +245,12 @@ void litert_lm_engine_settings_set_num_decode_tokens(
 // Returns an empty string if no error has occurred.
 // The returned pointer is valid until the next C API call on the same thread.
 LITERT_LM_C_API_EXPORT
-const char* litert_lm_get_last_error();
 // Creates a LiteRT LM Engine from the given settings. The caller is responsible
 // for destroying the engine using `litert_lm_engine_delete`.
 //
 // @param settings The engine settings.
 // @return A pointer to the created engine, or NULL on failure.
-//         Call litert_lm_get_last_error() for details on failure.
 LITERT_LM_C_API_EXPORT
 LiteRtLmEngine* litert_lm_engine_create(const LiteRtLmEngineSettings* settings);

package/package.json CHANGED Viewed

@@ -1,10 +1,10 @@
 {
   "name": "react-native-litert-lm",
-  "version": "0.3.4",
+  "version": "0.3.6",
   "litertLm": {
-    "version": "0.10.1",
-    "androidMavenVersion": "0.10.0",
-    "iosGitTag": "v0.10.1"
+    "version": "0.10.2",
+    "androidMavenVersion": "0.10.2",
+    "iosGitTag": "v0.10.2"
   },
   "description": "High-performance LLM inference for React Native using LiteRT-LM. Optimized for Gemma 4 and other on-device language models.",
   "license": "MIT",

package/scripts/build-ios-engine.sh CHANGED Viewed

@@ -267,7 +267,7 @@ for ARCH_NAME in "device" "simulator"; do
   <key>CFBundlePackageType</key>
   <string>FMWK</string>
   <key>CFBundleShortVersionString</key>
-  <string>0.9.0</string>
+  <string>0.10.2</string>
   <key>CFBundleVersion</key>
   <string>1</string>
   <key>MinimumOSVersion</key>

package/scripts/postinstall.js CHANGED Viewed

@@ -103,13 +103,20 @@ async function main() {
     log('iOS frameworks installed successfully.');
   } catch (err) {
-    // Don't fail the install — iOS frameworks are optional (Android-only users)
-    log(`Warning: Could not download iOS frameworks: ${err.message}`);
-    log('iOS builds will not work until frameworks are available.');
-    log('Run: scripts/download-ios-frameworks.sh to download manually.');
     // Cleanup partial download
     try { fs.unlinkSync(tmpZip); } catch {}
+    log(`Error: Could not download iOS frameworks: ${err.message}`);
+    log('iOS builds will not work until frameworks are available.');
+    log('Run: ./scripts/download-ios-frameworks.sh to download manually,');
+    log('  or: ./scripts/build-ios-engine.sh to build from source.');
+    // Fail fast on macOS so users discover the problem now, not at Xcode link time.
+    // SKIP_IOS_FRAMEWORK_DOWNLOAD is already checked above.
+    if (process.platform === 'darwin') {
+      log('Set SKIP_IOS_FRAMEWORK_DOWNLOAD=1 to suppress this error (e.g. Android-only builds).');
+      process.exit(1);
+    }
   }
 }

package/ios/LiteRTLMAutolinking.mm DELETED Viewed

@@ -1,30 +0,0 @@
-///
-/// LiteRTLMAutolinking.mm
-/// Registers the C++ HybridLiteRTLM implementation with NitroModules on iOS.
-///
-/// On iOS, there's no JNI_OnLoad equivalent, so we use ObjC +load to register
-/// the HybridObject factory before JS tries to create it.
-///
-#import <Foundation/Foundation.h>
-#include <NitroModules/HybridObjectRegistry.hpp>
-#include "HybridLiteRTLM.hpp"
-@interface LiteRTLMAutolinking : NSObject
-@end
-@implementation LiteRTLMAutolinking
-+ (void)load {
-  using namespace margelo::nitro;
-  using namespace margelo::nitro::litertlm;
-  HybridObjectRegistry::registerHybridObjectConstructor(
-    "LiteRTLM",
-    []() -> std::shared_ptr<HybridObject> {
-      return std::make_shared<HybridLiteRTLM>();
-    }
-  );
-}
-@end