npm - cui-llama.rn - Versions diffs - 1.7.3 → 1.7.6 - Mend

cui-llama.rn 1.7.3 → 1.7.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (276) hide show

package/src/index.ts CHANGED Viewed

@@ -12,6 +12,8 @@ import type {
   NativeSessionLoadResult,
   NativeCPUFeatures,
   NativeEmbeddingParams,
+  NativeRerankParams,
+  NativeRerankResult,
   NativeCompletionTokenProbItem,
   NativeCompletionResultTimings,
   JinjaFormattedChatResult,
@@ -53,6 +55,8 @@ export type {
   NativeEmbeddingResult,
   NativeSessionLoadResult,
   NativeEmbeddingParams,
+  NativeRerankParams,
+  NativeRerankResult,
   NativeCompletionTokenProbItem,
   NativeCompletionResultTimings,
   FormattedChatResult,
@@ -128,6 +132,16 @@ export type ContextParams = Omit<
 export type EmbeddingParams = NativeEmbeddingParams
+export type RerankParams = {
+  normalize?: number
+}
+export type RerankResult = {
+  score: number
+  index: number
+  document?: string
+}
 export type CompletionResponseFormat = {
   type: 'text' | 'json_object' | 'json_schema'
   json_schema?: {
@@ -227,7 +241,8 @@ export class LlamaContext {
       response_format?: CompletionResponseFormat
       tools?: object
       parallel_tool_calls?: object
-      tool_choice?: string
+      tool_choice?: string,
+      enable_thinking?: boolean,
     },
   ): Promise<FormattedChatResult | JinjaFormattedChatResult> {
     const mediaPaths: string[] = []
@@ -290,6 +305,7 @@ export class LlamaContext {
           ? JSON.stringify(params.parallel_tool_calls)
           : undefined,
         tool_choice: params?.tool_choice,
+        enable_thinking: params?.enable_thinking ?? true,
       },
     )
     if (!useJinja) {
@@ -336,6 +352,7 @@ export class LlamaContext {
           tools: params.tools,
           parallel_tool_calls: params.parallel_tool_calls,
           tool_choice: params.tool_choice,
+          enable_thinking: params.enable_thinking,
         },
       )
       if (formattedResult.type === 'jinja') {
@@ -446,6 +463,29 @@ export class LlamaContext {
     return RNLlama.embedding(this.id, text, params || {})
   }
+  /**
+   * Rerank documents based on relevance to a query
+   * @param query The query text to rank documents against
+   * @param documents Array of document texts to rank
+   * @param params Optional reranking parameters
+   * @returns Promise resolving to an array of ranking results with scores and indices
+   */
+  async rerank(
+    query: string,
+    documents: string[],
+    params?: RerankParams,
+  ): Promise<RerankResult[]> {
+    const results = await RNLlama.rerank(this.id, query, documents, params || {})
+    // Sort by score descending and add document text if requested
+    return results
+      .map((result) => ({
+        ...result,
+        document: documents[result.index],
+      }))
+      .sort((a, b) => b.score - a.score)
+  }
   async bench(
     pp: number,
     tg: number,
@@ -536,6 +576,70 @@ export class LlamaContext {
     return await RNLlama.releaseMultimodal(this.id)
   }
+  /**
+   * Initialize TTS support with a vocoder model
+   * @param params Parameters for TTS support
+   * @param params.path Path to the vocoder model
+   * @returns Promise resolving to true if initialization was successful
+   */
+  async initVocoder({ path }: { path: string }): Promise<boolean> {
+    if (path.startsWith('file://')) path = path.slice(7)
+    return await RNLlama.initVocoder(this.id, path)
+  }
+  /**
+   * Check if TTS support is enabled
+   * @returns Promise resolving to true if TTS is enabled
+   */
+  async isVocoderEnabled(): Promise<boolean> {
+    return await RNLlama.isVocoderEnabled(this.id)
+  }
+  /**
+   * Get a formatted audio completion prompt
+   * @param speakerJsonStr JSON string representing the speaker
+   * @param textToSpeak Text to speak
+   * @returns Promise resolving to the formatted audio completion prompt
+   */
+  async getFormattedAudioCompletion(
+    speaker: object | null,
+    textToSpeak: string,
+  ): Promise<string> {
+    return await RNLlama.getFormattedAudioCompletion(
+      this.id,
+      speaker ? JSON.stringify(speaker) : '',
+      textToSpeak,
+    )
+  }
+  /**
+   * Get guide tokens for audio completion
+   * @param textToSpeak Text to speak
+   * @returns Promise resolving to the guide tokens
+   */
+  async getAudioCompletionGuideTokens(
+    textToSpeak: string,
+  ): Promise<Array<number>> {
+    return await RNLlama.getAudioCompletionGuideTokens(this.id, textToSpeak)
+  }
+  /**
+   * Decode audio tokens
+   * @param tokens Array of audio tokens
+   * @returns Promise resolving to the decoded audio tokens
+   */
+  async decodeAudioTokens(tokens: number[]): Promise<Array<number>> {
+    return await RNLlama.decodeAudioTokens(this.id, tokens)
+  }
+  /**
+   * Release TTS support
+   * @returns Promise resolving to void
+   */
+  async releaseVocoder(): Promise<void> {
+    return await RNLlama.releaseVocoder(this.id)
+  }
   async release(): Promise<void> {
     return RNLlama.releaseContext(this.id)
   }

package/cpp/ggml-cpu/ggml-cpu-aarch64.h DELETED Viewed

@@ -1,8 +0,0 @@
-#pragma once
-#include "ggml-cpu-traits.h"
-#include "ggml.h"
-// GGML internal header
-lm_ggml_backend_buffer_type_t lm_ggml_backend_cpu_aarch64_buffer_type(void);