npm - @omote/core - Versions diffs - 0.5.7 → 0.6.4 - Mend

@omote/core 0.5.7 → 0.6.4

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

package/README.md CHANGED Viewed

@@ -35,11 +35,7 @@ The most common use case: feed TTS audio chunks and get back 52 ARKit blendshape
 import { FullFacePipeline, createA2E } from '@omote/core';
 // 1. Create A2E backend (auto-detects GPU vs CPU)
-const lam = createA2E({
-  gpuModelUrl: '/models/lam-wav2vec2.onnx',
-  cpuModelUrl: '/models/wav2arkit_cpu.onnx',
-  mode: 'auto',
-});
+const lam = createA2E(); // auto-detects GPU vs CPU, fetches from HF CDN (192MB fp16)
 await lam.load();
 // 2. Create pipeline with expression profile
@@ -72,12 +68,7 @@ Auto-detects platform: Chrome/Edge/Android use WebGPU, Safari/iOS use WASM CPU f
 ```typescript
 import { createA2E } from '@omote/core';
-const a2e = createA2E({
-  gpuModelUrl: '/models/lam-wav2vec2.onnx',       // 384MB, WebGPU
-  cpuModelUrl: '/models/wav2arkit_cpu.onnx',        // 404MB, WASM
-  mode: 'auto',            // 'auto' | 'gpu' | 'cpu'
-  fallbackOnError: true,   // GPU failure → auto-switch to CPU
-});
+const a2e = createA2E(); // auto-detects: GPU (192MB fp16) or CPU (404MB WASM)
 await a2e.load();
 const { blendshapes } = await a2e.infer(audioSamples); // Float32Array (16kHz)
@@ -89,7 +80,7 @@ const { blendshapes } = await a2e.infer(audioSamples); // Float32Array (16kHz)
 ```typescript
 import { Wav2Vec2Inference, LAM_BLENDSHAPES } from '@omote/core';
-const lam = new Wav2Vec2Inference({ modelUrl: '/models/lam-wav2vec2.onnx' });
+const lam = new Wav2Vec2Inference({ modelUrl: '/models/model_fp16.onnx' });
 await lam.load();
 const { blendshapes } = await lam.infer(audioSamples);
@@ -317,7 +308,7 @@ Place models in your public assets directory:
 ```
 public/models/
-  lam-wav2vec2.onnx              # A2E lip sync — WebGPU (384MB)
+  model_fp16.onnx                 # A2E lip sync — WebGPU (192MB fp16, from omote-ai/lam-a2e)
   wav2arkit_cpu.onnx              # A2E lip sync — WASM fallback (1.86MB graph)
   wav2arkit_cpu.onnx.data         # A2E lip sync — WASM fallback (402MB weights)
   sensevoice/model.int8.onnx      # SenseVoice ASR (239MB)