cui-llama.rn 1.2.4 → 1.2.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/cpp/llama.h CHANGED
@@ -2,6 +2,7 @@
2
2
  #define LLAMA_H
3
3
 
4
4
  #include "ggml.h"
5
+ #include "ggml-cpu.h"
5
6
  #include "ggml-backend.h"
6
7
 
7
8
  #include <stddef.h>
@@ -206,7 +207,7 @@ extern "C" {
206
207
  enum llama_split_mode {
207
208
  LLAMA_SPLIT_MODE_NONE = 0, // single GPU
208
209
  LLAMA_SPLIT_MODE_LAYER = 1, // split layers and KV across GPUs
209
- LLAMA_SPLIT_MODE_ROW = 2, // split rows across GPUs
210
+ LLAMA_SPLIT_MODE_ROW = 2, // split layers and KV across GPUs, use tensor parallelism if supported
210
211
  };
211
212
 
212
213
  // TODO: simplify (https://github.com/ggerganov/llama.cpp/pull/9294#pullrequestreview-2286561979)
@@ -275,10 +276,7 @@ extern "C" {
275
276
  int32_t n_gpu_layers; // number of layers to store in VRAM
276
277
  enum llama_split_mode split_mode; // how to split the model across multiple GPUs
277
278
 
278
- // main_gpu interpretation depends on split_mode:
279
- // LLAMA_SPLIT_MODE_NONE: the GPU that is used for the entire model
280
- // LLAMA_SPLIT_MODE_ROW: the GPU that is used for small tensors and intermediate results
281
- // LLAMA_SPLIT_MODE_LAYER: ignored
279
+ // the GPU that is used for the entire model when split_mode is LLAMA_SPLIT_MODE_NONE
282
280
  int32_t main_gpu;
283
281
 
284
282
  // proportion of the model (layers or rows) to offload to each GPU, size: llama_max_devices()
@@ -1088,12 +1086,6 @@ extern "C" {
1088
1086
  /// @details Minimum P sampling as described in https://github.com/ggerganov/llama.cpp/pull/3841
1089
1087
  LLAMA_API struct llama_sampler * llama_sampler_init_min_p (float p, size_t min_keep);
1090
1088
 
1091
- /// @details XTC sampling as described in https://github.com/oobabooga/text-generation-webui/pull/6335
1092
- LLAMA_API struct llama_sampler * llama_sampler_init_xtc (float xtc_p, float xtc_t, size_t min_keep, uint32_t seed);
1093
-
1094
- /// @details Tail Free Sampling described in https://www.trentonbricken.com/Tail-Free-Sampling/.
1095
- LLAMA_API struct llama_sampler * llama_sampler_init_tail_free (float z, size_t min_keep);
1096
-
1097
1089
  /// @details Locally Typical Sampling implementation described in the paper https://arxiv.org/abs/2202.00666.
1098
1090
  LLAMA_API struct llama_sampler * llama_sampler_init_typical (float p, size_t min_keep);
1099
1091
 
@@ -1145,6 +1137,16 @@ extern "C" {
1145
1137
  bool penalize_nl, // consider newlines as a repeatable token
1146
1138
  bool ignore_eos); // ignore the end-of-sequence token
1147
1139
 
1140
+ /// @details DRY sampler, designed by p-e-w, as described in: https://github.com/oobabooga/text-generation-webui/pull/5677, porting Koboldcpp implementation authored by pi6am: https://github.com/LostRuins/koboldcpp/pull/982
1141
+ LLAMA_API struct llama_sampler * llama_sampler_init_dry(
1142
+ const struct llama_model * model,
1143
+ float dry_multiplier,
1144
+ float dry_base,
1145
+ int32_t dry_allowed_length,
1146
+ int32_t dry_penalty_last_n,
1147
+ const char ** seq_breakers,
1148
+ size_t num_breakers);
1149
+
1148
1150
  LLAMA_API struct llama_sampler * llama_sampler_init_logit_bias(
1149
1151
  int32_t n_vocab,
1150
1152
  int32_t n_logit_bias,
package/cpp/sampling.cpp CHANGED
@@ -130,10 +130,12 @@ std::string common_sampler_params::print() const {
130
130
 
131
131
  snprintf(result, sizeof(result),
132
132
  "\trepeat_last_n = %d, repeat_penalty = %.3f, frequency_penalty = %.3f, presence_penalty = %.3f\n"
133
- "\ttop_k = %d, tfs_z = %.3f, top_p = %.3f, min_p = %.3f, xtc_probability = %.3f, xtc_threshold = %.3f, typical_p = %.3f, temp = %.3f\n"
133
+ "\tdry_multiplier = %.3f, dry_base = %.3f, dry_allowed_length = %d, dry_penalty_last_n = %d\n"
134
+ "\ttop_k = %d, top_p = %.3f, min_p = %.3f, xtc_probability = %.3f, xtc_threshold = %.3f, typical_p = %.3f, temp = %.3f\n"
134
135
  "\tmirostat = %d, mirostat_lr = %.3f, mirostat_ent = %.3f",
135
136
  penalty_last_n, penalty_repeat, penalty_freq, penalty_present,
136
- top_k, tfs_z, top_p, min_p, xtc_probability, xtc_threshold, typ_p, temp,
137
+ dry_multiplier, dry_base, dry_allowed_length, dry_penalty_last_n,
138
+ top_k, top_p, min_p, xtc_probability, xtc_threshold, typ_p, temp,
137
139
  mirostat, mirostat_eta, mirostat_tau);
138
140
 
139
141
  return std::string(result);
@@ -174,6 +176,17 @@ struct common_sampler * common_sampler_init(const struct llama_model * model, co
174
176
  if (params.mirostat == 0) {
175
177
  for (const auto & cnstr : params.samplers) {
176
178
  switch (cnstr) {
179
+ case COMMON_SAMPLER_TYPE_DRY:
180
+ {
181
+ std::vector<const char*> c_breakers;
182
+ c_breakers.reserve(params.dry_sequence_breakers.size());
183
+ for (const auto& str : params.dry_sequence_breakers) {
184
+ c_breakers.push_back(str.c_str());
185
+ }
186
+
187
+ llama_sampler_chain_add(result->chain, llama_sampler_init_dry (model, params.dry_multiplier, params.dry_base, params.dry_allowed_length, params.dry_penalty_last_n, c_breakers.data(), c_breakers.size()));
188
+ }
189
+ break;
177
190
  case COMMON_SAMPLER_TYPE_TOP_K:
178
191
  llama_sampler_chain_add(result->chain, llama_sampler_init_top_k (params.top_k));
179
192
  break;
@@ -186,9 +199,6 @@ struct common_sampler * common_sampler_init(const struct llama_model * model, co
186
199
  case COMMON_SAMPLER_TYPE_XTC:
187
200
  llama_sampler_chain_add(result->chain, llama_sampler_init_xtc (params.xtc_probability, params.xtc_threshold, params.min_keep, params.seed));
188
201
  break;
189
- case COMMON_SAMPLER_TYPE_TFS_Z:
190
- llama_sampler_chain_add(result->chain, llama_sampler_init_tail_free(params.tfs_z, params.min_keep));
191
- break;
192
202
  case COMMON_SAMPLER_TYPE_TYPICAL_P:
193
203
  llama_sampler_chain_add(result->chain, llama_sampler_init_typical (params.typ_p, params.min_keep));
194
204
  break;
@@ -358,8 +368,8 @@ std::string common_sampler_prev_str(common_sampler * gsmpl, llama_context * ctx_
358
368
 
359
369
  char common_sampler_type_to_chr(enum common_sampler_type cnstr) {
360
370
  switch (cnstr) {
371
+ case COMMON_SAMPLER_TYPE_DRY: return 'd';
361
372
  case COMMON_SAMPLER_TYPE_TOP_K: return 'k';
362
- case COMMON_SAMPLER_TYPE_TFS_Z: return 'f';
363
373
  case COMMON_SAMPLER_TYPE_TYPICAL_P: return 'y';
364
374
  case COMMON_SAMPLER_TYPE_TOP_P: return 'p';
365
375
  case COMMON_SAMPLER_TYPE_MIN_P: return 'm';
@@ -372,8 +382,8 @@ char common_sampler_type_to_chr(enum common_sampler_type cnstr) {
372
382
 
373
383
  std::string common_sampler_type_to_str(enum common_sampler_type cnstr) {
374
384
  switch (cnstr) {
385
+ case COMMON_SAMPLER_TYPE_DRY: return "dry";
375
386
  case COMMON_SAMPLER_TYPE_TOP_K: return "top_k";
376
- case COMMON_SAMPLER_TYPE_TFS_Z: return "tfs_z";
377
387
  case COMMON_SAMPLER_TYPE_TYPICAL_P: return "typ_p";
378
388
  case COMMON_SAMPLER_TYPE_TOP_P: return "top_p";
379
389
  case COMMON_SAMPLER_TYPE_MIN_P: return "min_p";
@@ -386,11 +396,11 @@ std::string common_sampler_type_to_str(enum common_sampler_type cnstr) {
386
396
 
387
397
  std::vector<common_sampler_type> common_sampler_types_from_names(const std::vector<std::string> & names, bool allow_alt_names) {
388
398
  std::unordered_map<std::string, common_sampler_type> sampler_canonical_name_map {
399
+ { "dry", COMMON_SAMPLER_TYPE_DRY },
389
400
  { "top_k", COMMON_SAMPLER_TYPE_TOP_K },
390
401
  { "top_p", COMMON_SAMPLER_TYPE_TOP_P },
391
402
  { "typ_p", COMMON_SAMPLER_TYPE_TYPICAL_P },
392
403
  { "min_p", COMMON_SAMPLER_TYPE_MIN_P },
393
- { "tfs_z", COMMON_SAMPLER_TYPE_TFS_Z },
394
404
  { "temperature", COMMON_SAMPLER_TYPE_TEMPERATURE },
395
405
  { "xtc", COMMON_SAMPLER_TYPE_XTC },
396
406
  { "infill", COMMON_SAMPLER_TYPE_INFILL },
@@ -407,8 +417,6 @@ std::vector<common_sampler_type> common_sampler_types_from_names(const std::vect
407
417
  { "typ-p", COMMON_SAMPLER_TYPE_TYPICAL_P },
408
418
  { "typ", COMMON_SAMPLER_TYPE_TYPICAL_P },
409
419
  { "min-p", COMMON_SAMPLER_TYPE_MIN_P },
410
- { "tfs-z", COMMON_SAMPLER_TYPE_TFS_Z },
411
- { "tfs", COMMON_SAMPLER_TYPE_TFS_Z },
412
420
  { "temp", COMMON_SAMPLER_TYPE_TEMPERATURE },
413
421
  };
414
422
 
@@ -434,8 +442,8 @@ std::vector<common_sampler_type> common_sampler_types_from_names(const std::vect
434
442
 
435
443
  std::vector<common_sampler_type> common_sampler_types_from_chars(const std::string & chars) {
436
444
  std::unordered_map<char, common_sampler_type> sampler_name_map = {
445
+ { common_sampler_type_to_chr(COMMON_SAMPLER_TYPE_DRY), COMMON_SAMPLER_TYPE_DRY },
437
446
  { common_sampler_type_to_chr(COMMON_SAMPLER_TYPE_TOP_K), COMMON_SAMPLER_TYPE_TOP_K },
438
- { common_sampler_type_to_chr(COMMON_SAMPLER_TYPE_TFS_Z), COMMON_SAMPLER_TYPE_TFS_Z },
439
447
  { common_sampler_type_to_chr(COMMON_SAMPLER_TYPE_TYPICAL_P), COMMON_SAMPLER_TYPE_TYPICAL_P },
440
448
  { common_sampler_type_to_chr(COMMON_SAMPLER_TYPE_TOP_P), COMMON_SAMPLER_TYPE_TOP_P },
441
449
  { common_sampler_type_to_chr(COMMON_SAMPLER_TYPE_MIN_P), COMMON_SAMPLER_TYPE_MIN_P },
package/cpp/sgemm.cpp CHANGED
@@ -942,6 +942,36 @@ class tinyBLAS_Q0_AVX {
942
942
  return _mm_sub_epi8(_mm_and_si128(_mm_set1_epi8(15), _mm_srli_epi16(x, 4)), _mm_set1_epi8(8));
943
943
  }
944
944
 
945
+ inline __m256i load(const block_q5_0 *b) {
946
+ return _mm256_or_si256(denibble(b->qs), bittobyte(b->qh));
947
+ }
948
+
949
+ inline __m128i load0(const block_q5_0* b) {
950
+ const __m128i x = _mm_loadu_si128((const __m128i *)(b->qs));
951
+ uint32_t x32;
952
+ memcpy(&x32, b->qh, sizeof(uint32_t));
953
+ __m128i qxl = _mm_and_si128(_mm_set1_epi8(15), x);
954
+ __m128i bytesl = _mm_cmpeq_epi8(_mm_set1_epi64x(-1),
955
+ _mm_or_si128(_mm_set1_epi64x(0x7fbfdfeff7fbfdfe),
956
+ _mm_shuffle_epi8(_mm_set1_epi32(x32),
957
+ _mm_set_epi64x(0x0101010101010101, 0x0000000000000000))));
958
+ bytesl = _mm_andnot_si128(bytesl, _mm_set1_epi8((char)0xF0));
959
+ return _mm_or_si128(qxl, bytesl);
960
+ }
961
+
962
+ inline __m128i load1(const block_q5_0* b) {
963
+ const __m128i x = _mm_loadu_si128((const __m128i *)(b->qs));
964
+ uint32_t x32;
965
+ memcpy(&x32, b->qh, sizeof(uint32_t));
966
+ __m128i qxh = _mm_and_si128(_mm_set1_epi8(15), _mm_srli_epi16(x, 4));
967
+ __m128i bytesh = _mm_cmpeq_epi8(_mm_set1_epi64x(-1),
968
+ _mm_or_si128(_mm_set1_epi64x(0x7fbfdfeff7fbfdfe),
969
+ _mm_shuffle_epi8(_mm_set1_epi32(x32),
970
+ _mm_set_epi64x(0x0303030303030303, 0x0202020202020202))));
971
+ bytesh = _mm_andnot_si128(bytesh, _mm_set1_epi8((char)0xF0));
972
+ return _mm_or_si128(qxh, bytesh);
973
+ }
974
+
945
975
  inline __m256i load(const block_iq4_nl *b) {
946
976
  return MM256_SET_M128I(load1(b), load0(b));
947
977
  }
@@ -973,6 +1003,17 @@ class tinyBLAS_Q0_AVX {
973
1003
  _mm_srli_epi16(x, 4), 1));
974
1004
  }
975
1005
 
1006
+ static inline __m256i bittobyte(const uint8_t *p) {
1007
+ uint32_t x32;
1008
+ memcpy(&x32, p, sizeof(uint32_t));
1009
+ __m256i bytes = _mm256_cmpeq_epi8(_mm256_set1_epi64x(-1),
1010
+ _mm256_or_si256(_mm256_set1_epi64x(0x7fbfdfeff7fbfdfe),
1011
+ _mm256_shuffle_epi8(_mm256_set1_epi32(x32),
1012
+ _mm256_set_epi64x(0x0303030303030303, 0x0202020202020202,
1013
+ 0x0101010101010101, 0x0000000000000000))));
1014
+ return _mm256_andnot_si256(bytes, _mm256_set1_epi8((char)0xF0));
1015
+ }
1016
+
976
1017
  const TA *const A;
977
1018
  const TB *const B;
978
1019
  TC *const C;
@@ -1182,6 +1223,22 @@ bool llamafile_sgemm(int64_t m, int64_t n, int64_t k, const void *A, int64_t lda
1182
1223
  #endif
1183
1224
  }
1184
1225
 
1226
+ case LM_GGML_TYPE_Q5_0: {
1227
+ if (Btype != LM_GGML_TYPE_Q8_0)
1228
+ return false;
1229
+ #if defined(__AVX2__) || defined(__AVX512F__) || defined(__AVX__)
1230
+ tinyBLAS_Q0_AVX<block_q5_0, block_q8_0, float> tb{
1231
+ k, (const block_q5_0 *)A, lda,
1232
+ (const block_q8_0 *)B, ldb,
1233
+ (float *)C, ldc,
1234
+ ith, nth};
1235
+ tb.matmul(m, n);
1236
+ return true;
1237
+ #else
1238
+ return false;
1239
+ #endif
1240
+ }
1241
+
1185
1242
  case LM_GGML_TYPE_IQ4_NL: {
1186
1243
  if (Btype != LM_GGML_TYPE_Q8_0)
1187
1244
  return false;
@@ -1 +1 @@
1
- {"version":3,"names":["_reactNative","require","_default","TurboModuleRegistry","get","exports","default"],"sourceRoot":"..\\..\\src","sources":["NativeRNLlama.ts"],"mappings":";;;;;;AACA,IAAAA,YAAA,GAAAC,OAAA;AAAkD,IAAAC,QAAA,GAsKnCC,gCAAmB,CAACC,GAAG,CAAO,SAAS,CAAC;AAAAC,OAAA,CAAAC,OAAA,GAAAJ,QAAA"}
1
+ {"version":3,"names":["_reactNative","require","_default","TurboModuleRegistry","get","exports","default"],"sourceRoot":"..\\..\\src","sources":["NativeRNLlama.ts"],"mappings":";;;;;;AACA,IAAAA,YAAA,GAAAC,OAAA;AAAkD,IAAAC,QAAA,GAqKnCC,gCAAmB,CAACC,GAAG,CAAO,SAAS,CAAC;AAAAC,OAAA,CAAAC,OAAA,GAAAJ,QAAA"}
@@ -1 +1 @@
1
- {"version":3,"names":["TurboModuleRegistry","get"],"sourceRoot":"..\\..\\src","sources":["NativeRNLlama.ts"],"mappings":"AACA,SAASA,mBAAmB,QAAQ,cAAc;AAsKlD,eAAeA,mBAAmB,CAACC,GAAG,CAAO,SAAS,CAAC"}
1
+ {"version":3,"names":["TurboModuleRegistry","get"],"sourceRoot":"..\\..\\src","sources":["NativeRNLlama.ts"],"mappings":"AACA,SAASA,mBAAmB,QAAQ,cAAc;AAqKlD,eAAeA,mBAAmB,CAACC,GAAG,CAAO,SAAS,CAAC"}
@@ -27,7 +27,6 @@ export type NativeCompletionParams = {
27
27
  min_p?: number;
28
28
  xtc_t?: number;
29
29
  xtc_p?: number;
30
- tfs_z?: number;
31
30
  typical_p?: number;
32
31
  temperature?: number;
33
32
  penalty_last_n?: number;
@@ -1 +1 @@
1
- {"version":3,"file":"NativeRNLlama.d.ts","sourceRoot":"","sources":["../../src/NativeRNLlama.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,cAAc,CAAA;AAG/C,MAAM,MAAM,mBAAmB,GAAG;IAChC,KAAK,EAAE,MAAM,CAAA;IACb,cAAc,CAAC,EAAE,OAAO,CAAA;IAExB,SAAS,CAAC,EAAE,OAAO,CAAA;IAEnB,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,OAAO,CAAC,EAAE,MAAM,CAAA;IAEhB,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,YAAY,CAAC,EAAE,MAAM,CAAA;IAErB,SAAS,CAAC,EAAE,OAAO,CAAA;IACnB,QAAQ,CAAC,EAAE,OAAO,CAAA;IAClB,UAAU,CAAC,EAAE,OAAO,CAAA;IAEpB,IAAI,CAAC,EAAE,MAAM,CAAA;IACb,WAAW,CAAC,EAAE,MAAM,CAAA;IAEpB,cAAc,CAAC,EAAE,MAAM,CAAA;IACvB,eAAe,CAAC,EAAE,MAAM,CAAA;CACzB,CAAA;AAED,MAAM,MAAM,sBAAsB,GAAG;IACnC,MAAM,EAAE,MAAM,CAAA;IACd,OAAO,CAAC,EAAE,MAAM,CAAA;IAChB,IAAI,CAAC,EAAE,KAAK,CAAC,MAAM,CAAC,CAAA;IAEpB,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,OAAO,CAAC,EAAE,MAAM,CAAA;IAChB,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,WAAW,CAAC,EAAE,MAAM,CAAA;IACpB,cAAc,CAAC,EAAE,MAAM,CAAA;IACvB,cAAc,CAAC,EAAE,MAAM,CAAA;IACvB,YAAY,CAAC,EAAE,MAAM,CAAA;IACrB,eAAe,CAAC,EAAE,MAAM,CAAA;IACxB,QAAQ,CAAC,EAAE,MAAM,CAAA;IACjB,YAAY,CAAC,EAAE,MAAM,CAAA;IACrB,YAAY,CAAC,EAAE,MAAM,CAAA;IACrB,WAAW,CAAC,EAAE,OAAO,CAAA;IACrB,IAAI,CAAC,EAAE,MAAM,CAAA;IAEb,UAAU,CAAC,EAAE,OAAO,CAAA;IACpB,UAAU,CAAC,EAAE,KAAK,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAA;IAEjC,uBAAuB,EAAE,OAAO,CAAA;CACjC,CAAA;AAED,MAAM,MAAM,6BAA6B,GAAG;IAC1C,OAAO,EAAE,MAAM,CAAA;IACf,IAAI,EAAE,MAAM,CAAA;CACb,CAAA;AAED,MAAM,MAAM,yBAAyB,GAAG;IACtC,OAAO,EAAE,MAAM,CAAA;IACf,KAAK,EAAE,KAAK,CAAC,6BAA6B,CAAC,CAAA;CAC5C,CAAA;AAED,MAAM,MAAM,6BAA6B,GAAG;IAC1C,QAAQ,EAAE,MAAM,CAAA;IAChB,SAAS,EAAE,MAAM,CAAA;IACjB,mBAAmB,EAAE,MAAM,CAAA;IAC3B,iBAAiB,EAAE,MAAM,CAAA;IACzB,WAAW,EAAE,MAAM,CAAA;IACnB,YAAY,EAAE,MAAM,CAAA;IACpB,sBAAsB,EAAE,MAAM,CAAA;IAC9B,oBAAoB,EAAE,MAAM,CAAA;CAC7B,CAAA;AAED,MAAM,MAAM,sBAAsB,GAAG;IACnC,IAAI,EAAE,MAAM,CAAA;IAEZ,gBAAgB,EAAE,MAAM,CAAA;IACxB,gBAAgB,EAAE,MAAM,CAAA;IACxB,SAAS,EAAE,OAAO,CAAA;IAClB,WAAW,EAAE,OAAO,CAAA;IACpB,YAAY,EAAE,MAAM,CAAA;IACpB,aAAa,EAAE,MAAM,CAAA;IACrB,aAAa,EAAE,MAAM,CAAA;IACrB,aAAa,EAAE,MAAM,CAAA;IACrB,OAAO,EAAE,6BAA6B,CAAA;IAEtC,wBAAwB,CAAC,EAAE,KAAK,CAAC,yBAAyB,CAAC,CAAA;CAC5D,CAAA;AAED,MAAM,MAAM,oBAAoB,GAAG;IACjC,MAAM,EAAE,KAAK,CAAC,MAAM,CAAC,CAAA;CACtB,CAAA;AAED,MAAM,MAAM,qBAAqB,GAAG;IAClC,SAAS,EAAE,KAAK,CAAC,MAAM,CAAC,CAAA;CACzB,CAAA;AAED,MAAM,MAAM,kBAAkB,GAAG;IAC/B,SAAS,EAAE,MAAM,CAAA;IACjB,GAAG,EAAE,OAAO,CAAA;IACZ,WAAW,EAAE,MAAM,CAAA;IACnB,KAAK,EAAE,MAAM,CAAA;CACd,CAAA;AAED,MAAM,MAAM,uBAAuB,GAAG;IACpC,aAAa,EAAE,MAAM,CAAA;IACrB,MAAM,EAAE,MAAM,CAAA;CACf,CAAA;AAED,MAAM,MAAM,sBAAsB,GAAG;IACnC,IAAI,EAAE,MAAM,CAAA;IACZ,OAAO,EAAE,MAAM,CAAA;CAChB,CAAA;AAED,MAAM,MAAM,iBAAiB,GAAG;IAC9B,KAAK,EAAE,OAAO,CAAA;IACd,IAAI,EAAE,OAAO,CAAA;IACb,OAAO,EAAE,OAAO,CAAA;CACjB,CAAA;AAED,MAAM,WAAW,IAAK,SAAQ,WAAW;IACvC,eAAe,CAAC,KAAK,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAA;IAC7C,WAAW,CAAC,MAAM,EAAE,mBAAmB,GAAG,OAAO,CAAC,kBAAkB,CAAC,CAAA;IAErE,WAAW,CACT,SAAS,EAAE,MAAM,EACjB,QAAQ,EAAE,MAAM,GACf,OAAO,CAAC,uBAAuB,CAAC,CAAA;IACnC,WAAW,CACT,SAAS,EAAE,MAAM,EACjB,QAAQ,EAAE,MAAM,EAChB,IAAI,EAAE,MAAM,GACX,OAAO,CAAC,MAAM,CAAC,CAAA;IAClB,UAAU,CACR,SAAS,EAAE,MAAM,EACjB,MAAM,EAAE,sBAAsB,GAC7B,OAAO,CAAC,sBAAsB,CAAC,CAAA;IAClC,cAAc,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAA;IAChD,aAAa,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,oBAAoB,CAAC,CAAA;IAC7E,YAAY,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,oBAAoB,CAAA;IACnE,cAAc,IAAK,OAAO,CAAC,iBAAiB,CAAC,CAAA;IAC7C,gBAAgB,CACd,SAAS,EAAE,MAAM,EACjB,QAAQ,EAAE,sBAAsB,EAAE,EAClC,YAAY,CAAC,EAAE,MAAM,GACpB,OAAO,CAAC,MAAM,CAAC,CAAA;IAClB,UAAU,CAAC,SAAS,EAAE,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IAChE,SAAS,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,qBAAqB,CAAC,CAAA;IAC1E,KAAK,CACH,SAAS,EAAE,MAAM,EACjB,EAAE,EAAE,MAAM,EACV,EAAE,EAAE,MAAM,EACV,EAAE,EAAE,MAAM,EACV,EAAE,EAAE,MAAM,GACT,OAAO,CAAC,MAAM,CAAC,CAAA;IAElB,cAAc,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAA;IAEhD,kBAAkB,IAAI,OAAO,CAAC,IAAI,CAAC,CAAA;CACpC;;AAED,wBAA+D"}
1
+ {"version":3,"file":"NativeRNLlama.d.ts","sourceRoot":"","sources":["../../src/NativeRNLlama.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,cAAc,CAAA;AAG/C,MAAM,MAAM,mBAAmB,GAAG;IAChC,KAAK,EAAE,MAAM,CAAA;IACb,cAAc,CAAC,EAAE,OAAO,CAAA;IAExB,SAAS,CAAC,EAAE,OAAO,CAAA;IAEnB,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,OAAO,CAAC,EAAE,MAAM,CAAA;IAEhB,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,YAAY,CAAC,EAAE,MAAM,CAAA;IAErB,SAAS,CAAC,EAAE,OAAO,CAAA;IACnB,QAAQ,CAAC,EAAE,OAAO,CAAA;IAClB,UAAU,CAAC,EAAE,OAAO,CAAA;IAEpB,IAAI,CAAC,EAAE,MAAM,CAAA;IACb,WAAW,CAAC,EAAE,MAAM,CAAA;IAEpB,cAAc,CAAC,EAAE,MAAM,CAAA;IACvB,eAAe,CAAC,EAAE,MAAM,CAAA;CACzB,CAAA;AAED,MAAM,MAAM,sBAAsB,GAAG;IACnC,MAAM,EAAE,MAAM,CAAA;IACd,OAAO,CAAC,EAAE,MAAM,CAAA;IAChB,IAAI,CAAC,EAAE,KAAK,CAAC,MAAM,CAAC,CAAA;IAEpB,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,OAAO,CAAC,EAAE,MAAM,CAAA;IAChB,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,KAAK,CAAC,EAAE,MAAM,CAAA;IACd,SAAS,CAAC,EAAE,MAAM,CAAA;IAClB,WAAW,CAAC,EAAE,MAAM,CAAA;IACpB,cAAc,CAAC,EAAE,MAAM,CAAA;IACvB,cAAc,CAAC,EAAE,MAAM,CAAA;IACvB,YAAY,CAAC,EAAE,MAAM,CAAA;IACrB,eAAe,CAAC,EAAE,MAAM,CAAA;IACxB,QAAQ,CAAC,EAAE,MAAM,CAAA;IACjB,YAAY,CAAC,EAAE,MAAM,CAAA;IACrB,YAAY,CAAC,EAAE,MAAM,CAAA;IACrB,WAAW,CAAC,EAAE,OAAO,CAAA;IACrB,IAAI,CAAC,EAAE,MAAM,CAAA;IAEb,UAAU,CAAC,EAAE,OAAO,CAAA;IACpB,UAAU,CAAC,EAAE,KAAK,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAA;IAEjC,uBAAuB,EAAE,OAAO,CAAA;CACjC,CAAA;AAED,MAAM,MAAM,6BAA6B,GAAG;IAC1C,OAAO,EAAE,MAAM,CAAA;IACf,IAAI,EAAE,MAAM,CAAA;CACb,CAAA;AAED,MAAM,MAAM,yBAAyB,GAAG;IACtC,OAAO,EAAE,MAAM,CAAA;IACf,KAAK,EAAE,KAAK,CAAC,6BAA6B,CAAC,CAAA;CAC5C,CAAA;AAED,MAAM,MAAM,6BAA6B,GAAG;IAC1C,QAAQ,EAAE,MAAM,CAAA;IAChB,SAAS,EAAE,MAAM,CAAA;IACjB,mBAAmB,EAAE,MAAM,CAAA;IAC3B,iBAAiB,EAAE,MAAM,CAAA;IACzB,WAAW,EAAE,MAAM,CAAA;IACnB,YAAY,EAAE,MAAM,CAAA;IACpB,sBAAsB,EAAE,MAAM,CAAA;IAC9B,oBAAoB,EAAE,MAAM,CAAA;CAC7B,CAAA;AAED,MAAM,MAAM,sBAAsB,GAAG;IACnC,IAAI,EAAE,MAAM,CAAA;IAEZ,gBAAgB,EAAE,MAAM,CAAA;IACxB,gBAAgB,EAAE,MAAM,CAAA;IACxB,SAAS,EAAE,OAAO,CAAA;IAClB,WAAW,EAAE,OAAO,CAAA;IACpB,YAAY,EAAE,MAAM,CAAA;IACpB,aAAa,EAAE,MAAM,CAAA;IACrB,aAAa,EAAE,MAAM,CAAA;IACrB,aAAa,EAAE,MAAM,CAAA;IACrB,OAAO,EAAE,6BAA6B,CAAA;IAEtC,wBAAwB,CAAC,EAAE,KAAK,CAAC,yBAAyB,CAAC,CAAA;CAC5D,CAAA;AAED,MAAM,MAAM,oBAAoB,GAAG;IACjC,MAAM,EAAE,KAAK,CAAC,MAAM,CAAC,CAAA;CACtB,CAAA;AAED,MAAM,MAAM,qBAAqB,GAAG;IAClC,SAAS,EAAE,KAAK,CAAC,MAAM,CAAC,CAAA;CACzB,CAAA;AAED,MAAM,MAAM,kBAAkB,GAAG;IAC/B,SAAS,EAAE,MAAM,CAAA;IACjB,GAAG,EAAE,OAAO,CAAA;IACZ,WAAW,EAAE,MAAM,CAAA;IACnB,KAAK,EAAE,MAAM,CAAA;CACd,CAAA;AAED,MAAM,MAAM,uBAAuB,GAAG;IACpC,aAAa,EAAE,MAAM,CAAA;IACrB,MAAM,EAAE,MAAM,CAAA;CACf,CAAA;AAED,MAAM,MAAM,sBAAsB,GAAG;IACnC,IAAI,EAAE,MAAM,CAAA;IACZ,OAAO,EAAE,MAAM,CAAA;CAChB,CAAA;AAED,MAAM,MAAM,iBAAiB,GAAG;IAC9B,KAAK,EAAE,OAAO,CAAA;IACd,IAAI,EAAE,OAAO,CAAA;IACb,OAAO,EAAE,OAAO,CAAA;CACjB,CAAA;AAED,MAAM,WAAW,IAAK,SAAQ,WAAW;IACvC,eAAe,CAAC,KAAK,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAA;IAC7C,WAAW,CAAC,MAAM,EAAE,mBAAmB,GAAG,OAAO,CAAC,kBAAkB,CAAC,CAAA;IAErE,WAAW,CACT,SAAS,EAAE,MAAM,EACjB,QAAQ,EAAE,MAAM,GACf,OAAO,CAAC,uBAAuB,CAAC,CAAA;IACnC,WAAW,CACT,SAAS,EAAE,MAAM,EACjB,QAAQ,EAAE,MAAM,EAChB,IAAI,EAAE,MAAM,GACX,OAAO,CAAC,MAAM,CAAC,CAAA;IAClB,UAAU,CACR,SAAS,EAAE,MAAM,EACjB,MAAM,EAAE,sBAAsB,GAC7B,OAAO,CAAC,sBAAsB,CAAC,CAAA;IAClC,cAAc,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAA;IAChD,aAAa,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,oBAAoB,CAAC,CAAA;IAC7E,YAAY,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,oBAAoB,CAAA;IACnE,cAAc,IAAK,OAAO,CAAC,iBAAiB,CAAC,CAAA;IAC7C,gBAAgB,CACd,SAAS,EAAE,MAAM,EACjB,QAAQ,EAAE,sBAAsB,EAAE,EAClC,YAAY,CAAC,EAAE,MAAM,GACpB,OAAO,CAAC,MAAM,CAAC,CAAA;IAClB,UAAU,CAAC,SAAS,EAAE,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,CAAC,CAAA;IAChE,SAAS,CAAC,SAAS,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,qBAAqB,CAAC,CAAA;IAC1E,KAAK,CACH,SAAS,EAAE,MAAM,EACjB,EAAE,EAAE,MAAM,EACV,EAAE,EAAE,MAAM,EACV,EAAE,EAAE,MAAM,EACV,EAAE,EAAE,MAAM,GACT,OAAO,CAAC,MAAM,CAAC,CAAA;IAElB,cAAc,CAAC,SAAS,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC,CAAA;IAEhD,kBAAkB,IAAI,OAAO,CAAC,IAAI,CAAC,CAAA;CACpC;;AAED,wBAA+D"}
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "cui-llama.rn",
3
- "version": "1.2.4",
3
+ "version": "1.2.6",
4
4
  "description": "Fork of llama.rn for ChatterUI",
5
5
  "main": "lib/commonjs/index",
6
6
  "module": "lib/module/index",
@@ -37,7 +37,6 @@ export type NativeCompletionParams = {
37
37
  min_p?: number
38
38
  xtc_t?: number
39
39
  xtc_p?: number
40
- tfs_z?: number
41
40
  typical_p?: number
42
41
  temperature?: number // -> temp
43
42
  penalty_last_n?: number