RubyGems - llama_cpp - Versions diffs - 0.21.2 → 0.22.1 - Mend

llama_cpp 0.21.2 → 0.22.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 5f3d80e415240f21df0ba7e314118712f6f2d2d8cb052eef41127e7de7ae7e51
-  data.tar.gz: 67fff55bf83ef4d97f24b0c3c450eb493464763c23595fcb5b60c248fd1f551e
+  metadata.gz: d9d289500d478dbaea942656eeaf4c076dd81fdcbf5fe670c323c5ce431945da
+  data.tar.gz: 5dff9d66db034b7f275add566e760adf84b10b578ff9a2fb32a684fd17735f8a
 SHA512:
-  metadata.gz: f6a129952bc812c130a235743beeb0a5ebcafcbe627d7d13d625e8cf5b143e2cb41cd4d78cfacc98c00a1d0857dc68bb8a6b30d486da5f22e8bcbc6a63ac5489
-  data.tar.gz: c944f2a37727bd3e295dc83d9d9c5c5748a04d7f867aad86895c312a100fa65b7c3fa9f3973bf08adc47c26c2a0e73586f7aa92b92230bee72c86b10dc4693fc
+  metadata.gz: 6b3109cee58c80d79ba90aa3ec33e0517c8bb54a1592ff4020ca18e16bf78c0bed5389ac1c5dd1221e757c87c8e3fb1af226c45d5b3d2a5b1ee6bc7afd13e242
+  data.tar.gz: 139cb66ec6cd2adbd2b178ad7f84581698905870bb549105f9683e14a80d04d8210405762e98937fed685352a4434d89f8fe43d8cbf500b1396d091c7d6366ba

data/CHANGELOG.md CHANGED Viewed

@@ -1,3 +1,27 @@
+## [[0.22.1](https://github.com/yoshoku/llama_cpp.rb/compare/v0.22.0...v0.22.1)] - 2025-08-30
+- Change supported llama.cpp version to b6310.
+  - Add `llama_adapter_meta_count` module function.
+## [[0.22.0](https://github.com/yoshoku/llama_cpp.rb/compare/v0.21.2...v0.22.0)] - 2025-08-23
+- Change supported llama.cpp version to b6240.
+  - Add `llama_state_seq_get_size_ext` module function.
+  - Add `LLAMA_STATE_SEQ_FLAGS_SWA_ONLY` constant.
+  - Remove `LlamaKvCache` class.
+  - Remove `llama_get_kv_self` module function.
+  - Remove `llama_kv_self_clear` module function.
+  - Remove `llama_kv_self_seq_rm` module function.
+  - Remove `llama_kv_self_seq_cp` module function.
+  - Remove `llama_kv_self_seq_keep` module function.
+  - Remove `llama_kv_self_seq_add` module function.
+  - Remove `llama_kv_self_seq_div` module function.
+  - Remove `llama_kv_self_seq_pos_min` module function.
+  - Remove `llama_kv_self_seq_pos_max` module function.
+  - Remove `llama_kv_self_defrag` module function.
+  - Remove `llama_kv_self_can_shift?` module function.
+  - Remove `llama_kv_self_update` module function.
 ## [[0.21.2](https://github.com/yoshoku/llama_cpp.rb/compare/v0.21.1...v0.21.2)] - 2025-08-09
 - Change supported llama.cpp version to b6100.

data/ext/llama_cpp/llama_cpp.c CHANGED Viewed

@@ -11,7 +11,6 @@ VALUE rb_cLlamaModelQuantizeParams;
 VALUE rb_cLlamaLogitBias;
 VALUE rb_cLlamaAdapterLora;
 VALUE rb_cLlamaMemoryT;
-VALUE rb_cLlamaKvCache;
 VALUE rb_cLlamaTokenDataArray;
 VALUE rb_cLlamaBatch;
 VALUE rb_cLlamaSampler;
@@ -1853,6 +1852,20 @@ static VALUE rb_llama_adapter_lora_init(VALUE self, VALUE model, VALUE path_lora
   return TypedData_Wrap_Struct(rb_cLlamaAdapterLora, &llama_adapter_lora_wrapper_data_type, adapter_wrapper);
 }
+/**
+ * @overload llama_adapter_meta_count(adapter)
+ * @param [LlamaAdapterLora] adapter
+ * @return [Integer]
+ */
+static VALUE rb_llama_adapter_meta_count(VALUE self, VALUE adapter) {
+  if (!rb_obj_is_kind_of(adapter, rb_cLlamaAdapterLora)) {
+    rb_raise(rb_eArgError, "adapter must be a LlamaAdapterLora");
+    return Qnil;
+  }
+  llama_adapter_lora_wrapper* adapter_wrapper = get_llama_adapter_lora_wrapper(adapter);
+  return INT2NUM(llama_adapter_meta_count(adapter_wrapper->adapter));
+}
 /**
  * @overload llama_set_adapter_lora(context, adapter, scale)
  *  @param [LlamaContext] context
@@ -2172,264 +2185,29 @@ static VALUE rb_llama_get_memory(VALUE self, VALUE ctx) {
   return TypedData_Wrap_Struct(rb_cLlamaMemoryT, &llama_memory_t_wrapper_data_type, memory_wrapper);
 }
-/* llama_kv_cache wrapper */
-typedef struct {
-  struct llama_kv_cache* kv_cache;
-} llama_kv_cache_wrapper;
-static void llama_kv_cache_wrapper_free(void *ptr) {
-  if (ptr) {
-    ruby_xfree(ptr);
-  }
-}
-static size_t llama_kv_cache_wrapper_size(const void *ptr) {
-  return sizeof(*((llama_kv_cache_wrapper*)ptr));
-}
-static rb_data_type_t llama_kv_cache_wrapper_data_type = {
-  "LlamaKvCache",
-  { NULL,
-    llama_kv_cache_wrapper_free,
-    llama_kv_cache_wrapper_size },
-  NULL,
-  NULL,
-  RUBY_TYPED_FREE_IMMEDIATELY
-};
-static VALUE llama_kv_cache_wrapper_alloc(VALUE self) {
-  llama_kv_cache_wrapper* data = (llama_kv_cache_wrapper*)ruby_xmalloc(sizeof(llama_kv_cache_wrapper));
-  data->kv_cache = NULL;
-  return TypedData_Wrap_Struct(self, &llama_kv_cache_wrapper_data_type, data);
-}
-// static llama_kv_cache_wrapper* get_llama_kv_cache_wrapper(VALUE self) {
-//   llama_kv_cache_wrapper* data = NULL;
-//   TypedData_Get_Struct(self, llama_kv_cache_wrapper, &llama_kv_cache_wrapper_data_type, data);
-//   return data;
-// }
-/**
- * @overload llama_get_kv_self(context)
- *  @param [LlamaContext] context
- *  @return [LlamaKvCache]
- */
-static VALUE rb_llama_get_kv_self(VALUE self, VALUE ctx) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  llama_kv_cache_wrapper* kv_cache_wrapper = (llama_kv_cache_wrapper*)ruby_xmalloc(sizeof(llama_kv_cache_wrapper));
-  kv_cache_wrapper->kv_cache = llama_get_kv_self(context_wrapper->context);
-  RB_GC_GUARD(ctx);
-  return TypedData_Wrap_Struct(rb_cLlamaKvCache, &llama_kv_cache_wrapper_data_type, kv_cache_wrapper);
-}
-/**
- * @overload llama_kv_self_clear(context)
- *  @param [LlamaContext] context
- *  @return [NilClass]
- */
-static VALUE rb_llama_kv_self_clear(VALUE self, VALUE ctx) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  llama_kv_self_clear(context_wrapper->context);
-  RB_GC_GUARD(ctx);
-  return Qnil;
-}
-/**
- * @overload llama_kv_self_seq_rm(context, seq_id, p0, p1)
- *  @param [LlamaContext] context
- *  @param [Integer] seq_id
- *  @param [Integer] p0
- *  @param [Integer] p1
- *  @return [Boolean]
- */
-static VALUE rb_llama_kv_self_seq_rm(VALUE self, VALUE ctx, VALUE seq_id, VALUE p0, VALUE p1) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(seq_id)) {
-    rb_raise(rb_eArgError, "seq_id must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(p0)) {
-    rb_raise(rb_eArgError, "p0 must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(p1)) {
-    rb_raise(rb_eArgError, "p1 must be an Integer");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  const bool res = llama_kv_self_seq_rm(context_wrapper->context, NUM2INT(seq_id), NUM2INT(p0), NUM2INT(p1));
-  RB_GC_GUARD(ctx);
-  return res ? Qtrue : Qfalse;
-}
-/**
- * @overload llama_kv_self_seq_cp(context, seq_id_src, seq_id_dst, p0, p1)
- *  @param [LlamaContext] context
- *  @param [Integer] seq_id_src
- *  @param [Integer] seq_id_dst
- *  @param [Integer] p0
- *  @param [Integer] p1
- *  @return [NilClass]
- */
-static VALUE rb_llama_kv_self_seq_cp(VALUE self, VALUE ctx, VALUE seq_id_src, VALUE seq_id_dst, VALUE p0, VALUE p1) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(seq_id_src)) {
-    rb_raise(rb_eArgError, "seq_id_src must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(seq_id_dst)) {
-    rb_raise(rb_eArgError, "seq_id_dst must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(p0)) {
-    rb_raise(rb_eArgError, "p0 must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(p1)) {
-    rb_raise(rb_eArgError, "p1 must be an Integer");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  llama_kv_self_seq_cp(context_wrapper->context, NUM2INT(seq_id_src), NUM2INT(seq_id_dst), NUM2INT(p0), NUM2INT(p1));
-  RB_GC_GUARD(ctx);
-  return Qnil;
-}
-/**
- * @overload llama_kv_self_seq_keep(context, seq_id)
- *  @param [LlamaContext] context
- *  @param [Integer] seq_id
- *  @return [NilClass]
- */
-static VALUE rb_llama_kv_self_seq_keep(VALUE self, VALUE ctx, VALUE seq_id) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(seq_id)) {
-    rb_raise(rb_eArgError, "seq_id must be an Integer");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  llama_kv_self_seq_keep(context_wrapper->context, NUM2INT(seq_id));
-  RB_GC_GUARD(ctx);
-  return Qnil;
-}
-/**
- * @overload llama_kv_self_seq_add(context, seq_id, p0, p1, delta)
- *  @param [LlamaContext] context
- *  @param [Integer] seq_id
- *  @param [Integer] p0
- *  @param [Integer] p1
- *  @param [Integer] delta
- *  @return [NilClass]
- */
-static VALUE rb_llama_kv_self_seq_add(VALUE self, VALUE ctx, VALUE seq_id, VALUE p0, VALUE p1, VALUE delta) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(seq_id)) {
-    rb_raise(rb_eArgError, "seq_id must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(p0)) {
-    rb_raise(rb_eArgError, "p0 must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(p1)) {
-    rb_raise(rb_eArgError, "p1 must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(delta)) {
-    rb_raise(rb_eArgError, "delta must be an Integer");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  llama_kv_self_seq_add(context_wrapper->context, NUM2INT(seq_id), NUM2INT(p0), NUM2INT(p1), NUM2INT(delta));
-  RB_GC_GUARD(ctx);
-  return Qnil;
-}
 /**
- * @overload llama_kv_self_seq_div(context, seq_id, p0, p1, d)
- *  @param [LlamaContext] context
- *  @param [Integer] seq_id
- *  @param [Integer] p0
- *  @param [Integer] p1
- *  @param [Integer] d
- *  @return [NilClass]
- */
-static VALUE rb_llama_kv_self_seq_div(VALUE self, VALUE ctx, VALUE seq_id, VALUE p0, VALUE p1, VALUE d) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(seq_id)) {
-    rb_raise(rb_eArgError, "seq_id must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(p0)) {
-    rb_raise(rb_eArgError, "p0 must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(p1)) {
-    rb_raise(rb_eArgError, "p1 must be an Integer");
-    return Qnil;
-  }
-  if (!RB_INTEGER_TYPE_P(d)) {
-    rb_raise(rb_eArgError, "d must be an Integer");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  llama_kv_self_seq_div(context_wrapper->context, NUM2INT(seq_id), NUM2INT(p0), NUM2INT(p1), NUM2INT(d));
-  RB_GC_GUARD(ctx);
-  return Qnil;
-}
-/**
- * @overload llama_kv_self_seq_pos_min(context, seq_id)
+ * @overload llama_state_get_size(context)
  *  @param [LlamaContext] context
- *  @param [Integer] seq_id
  *  @return [Integer]
  */
-static VALUE rb_llama_kv_self_seq_pos_min(VALUE self, VALUE ctx, VALUE seq_id) {
+static VALUE rb_llama_state_get_size(VALUE self, VALUE ctx) {
   if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
     rb_raise(rb_eArgError, "ctx must be a LlamaContext");
     return Qnil;
   }
-  if (!RB_INTEGER_TYPE_P(seq_id)) {
-    rb_raise(rb_eArgError, "seq_id must be an Integer");
-    return Qnil;
-  }
   llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  const int32_t pos_max = llama_kv_self_seq_pos_min(context_wrapper->context, NUM2INT(seq_id));
+  const size_t size = llama_state_get_size(context_wrapper->context);
   RB_GC_GUARD(ctx);
-  return INT2NUM(pos_max);
+  return SIZET2NUM(size);
 }
 /**
- * @overload llama_kv_self_seq_pos_max(context, seq_id)
+ * @overload llama_state_seq_get_size(context, seq_id)
  *  @param [LlamaContext] context
  *  @param [Integer] seq_id
  *  @return [Integer]
  */
-static VALUE rb_llama_kv_self_seq_pos_max(VALUE self, VALUE ctx, VALUE seq_id) {
+static VALUE rb_llama_state_seq_get_size(VALUE self, VALUE ctx, VALUE seq_id) {
   if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
     rb_raise(rb_eArgError, "ctx must be a LlamaContext");
     return Qnil;
@@ -2439,82 +2217,19 @@ static VALUE rb_llama_kv_self_seq_pos_max(VALUE self, VALUE ctx, VALUE seq_id) {
     return Qnil;
   }
   llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  const int32_t pos_max = llama_kv_self_seq_pos_max(context_wrapper->context, NUM2INT(seq_id));
-  RB_GC_GUARD(ctx);
-  return INT2NUM(pos_max);
-}
-/**
- * @overload llama_kv_self_defrag(context)
- *  @param [LlamaContext] context
- *  @return [NilClass]
- */
-static VALUE rb_llama_kv_self_defrag(VALUE self, VALUE ctx) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  llama_kv_self_defrag(context_wrapper->context);
-  RB_GC_GUARD(ctx);
-  return Qnil;
-}
-/**
- * @overload llama_kv_self_update(context)
- *  @param [LlamaContext] context
- *  @return [NilClass]
- */
-static VALUE rb_llama_kv_self_update(VALUE self, VALUE ctx) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  llama_kv_self_update(context_wrapper->context);
-  RB_GC_GUARD(ctx);
-  return Qnil;
-}
-/**
- * @overload llama_kv_self_can_shift?(context)
- *  @param [LlamaContext] context
- *  @return [Boolean]
- */
-static VALUE rb_llama_kv_self_can_shift(VALUE self, VALUE ctx) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  const bool res = llama_kv_self_can_shift(context_wrapper->context);
-  RB_GC_GUARD(ctx);
-  return res ? Qtrue : Qfalse;
-}
-/**
- * @overload llama_state_get_size(context)
- *  @param [LlamaContext] context
- *  @return [Integer]
- */
-static VALUE rb_llama_state_get_size(VALUE self, VALUE ctx) {
-  if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
-    rb_raise(rb_eArgError, "ctx must be a LlamaContext");
-    return Qnil;
-  }
-  llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  const size_t size = llama_state_get_size(context_wrapper->context);
+  const size_t size = llama_state_seq_get_size(context_wrapper->context, NUM2INT(seq_id));
   RB_GC_GUARD(ctx);
   return SIZET2NUM(size);
 }
 /**
- * @overload llama_state_seq_get_size(context, seq_id)
+ * @overload llama_state_seq_get_size_ext(context, seq_id, flags)
  *  @param [LlamaContext] context
  *  @param [Integer] seq_id
+ *  @param [Integer] flags
  *  @return [Integer]
  */
-static VALUE rb_llama_state_seq_get_size(VALUE self, VALUE ctx, VALUE seq_id) {
+static VALUE rb_llama_state_seq_get_size_ext(VALUE self, VALUE ctx, VALUE seq_id, VALUE flags) {
   if (!rb_obj_is_kind_of(ctx, rb_cLlamaContext)) {
     rb_raise(rb_eArgError, "ctx must be a LlamaContext");
     return Qnil;
@@ -2523,8 +2238,12 @@ static VALUE rb_llama_state_seq_get_size(VALUE self, VALUE ctx, VALUE seq_id) {
     rb_raise(rb_eArgError, "seq_id must be an Integer");
     return Qnil;
   }
+  if (!RB_INTEGER_TYPE_P(flags)) {
+    rb_raise(rb_eArgError, "flags must be an Integer");
+    return Qnil;
+  }
   llama_context_wrapper* context_wrapper = get_llama_context_wrapper(ctx);
-  const size_t size = llama_state_seq_get_size(context_wrapper->context, NUM2INT(seq_id));
+  const size_t size = llama_state_seq_get_size_ext(context_wrapper->context, NUM2INT(seq_id), (uint32_t)NUM2UINT(flags));
   RB_GC_GUARD(ctx);
   return SIZET2NUM(size);
 }
@@ -4187,6 +3906,7 @@ void Init_llama_cpp(void) {
   rb_define_const(rb_mLlamaCpp, "LLAMA_DEFAULT_SEED", rb_str_new2(tmp));
   rb_define_const(rb_mLlamaCpp, "LLAMA_TOKEN_NULL", INT2NUM(LLAMA_TOKEN_NULL));
+  rb_define_const(rb_mLlamaCpp, "LLAMA_STATE_SEQ_FLAGS_SWA_ONLY", INT2NUM(LLAMA_STATE_SEQ_FLAGS_SWA_ONLY));
   sprintf(tmp, "0x%x", LLAMA_FILE_MAGIC_GGLA);
   rb_define_const(rb_mLlamaCpp, "LLAMA_FILE_MAGIC_GGLA", rb_str_new2(tmp));
@@ -5066,9 +4786,6 @@ void Init_llama_cpp(void) {
   /* TODO: llama_get_model */
   rb_define_module_function(rb_mLlamaCpp, "llama_get_model", rb_llama_get_model, 1);
-  /* llama_get_kv_self */
-  rb_define_module_function(rb_mLlamaCpp, "llama_get_kv_self", rb_llama_get_kv_self, 1);
   /* llama_get_memory */
   rb_define_module_function(rb_mLlamaCpp, "llama_get_memory", rb_llama_get_memory, 1);
@@ -5152,6 +4869,14 @@ void Init_llama_cpp(void) {
   /* llama_adapter_lora_init */
   rb_define_module_function(rb_mLlamaCpp, "llama_adapter_lora_init", rb_llama_adapter_lora_init, 2);
+  /* TODO: llama_adapter_meta_val_str */
+  /* llama_adapter_meta_count */
+  rb_define_module_function(rb_mLlamaCpp, "llama_adapter_meta_count", rb_llama_adapter_meta_count, 1);
+  /* TODO: llama_adapter_meta_key_by_index */
+  /* TODO: llama_adapter_meta_val_str_by_index */
   /* llama_set_adapter_lora */
   rb_define_module_function(rb_mLlamaCpp, "llama_set_adapter_lora", rb_llama_set_adapter_lora, 3);
@@ -5200,46 +4925,6 @@ void Init_llama_cpp(void) {
   /* llama_memory_can_shift */
   rb_define_module_function(rb_mLlamaCpp, "llama_memory_can_shift?", rb_llama_memory_can_shift, 1);
-  /**
-   * Document-class: LlamaCpp::LlamaKvCache
-   * "struct llama_kv_cache" wrapper class
-   */
-  rb_cLlamaKvCache = rb_define_class_under(rb_mLlamaCpp, "LlamaKvCache", rb_cObject);
-  rb_define_alloc_func(rb_cLlamaKvCache, llama_kv_cache_wrapper_alloc);
-  /* llama_kv_self_clear */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_clear", rb_llama_kv_self_clear, 1);
-  /* llama_kv_self_seq_rm */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_seq_rm", rb_llama_kv_self_seq_rm, 4);
-  /* llama_kv_self_seq_cp */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_seq_cp", rb_llama_kv_self_seq_cp, 5);
-  /* llama_kv_self_seq_keep */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_seq_keep", rb_llama_kv_self_seq_keep, 2);
-  /* llama_kv_self_seq_add */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_seq_add", rb_llama_kv_self_seq_add, 5);
-  /* llama_kv_self_seq_div */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_seq_div", rb_llama_kv_self_seq_div, 5);
-  /* llama_kv_self_seq_pos_min */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_seq_pos_min", rb_llama_kv_self_seq_pos_min, 2);
-  /* llama_kv_self_seq_pos_max */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_seq_pos_max", rb_llama_kv_self_seq_pos_max, 2);
-  /* llama_kv_self_defrag */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_defrag", rb_llama_kv_self_defrag, 1);
-  /* llama_kv_self_update */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_update", rb_llama_kv_self_update, 1);
-  /* llama_kv_self_can_shift */
-  rb_define_module_function(rb_mLlamaCpp, "llama_kv_self_can_shift?", rb_llama_kv_self_can_shift, 1);
   /* llama_state_get_size */
   rb_define_module_function(rb_mLlamaCpp, "llama_state_get_size", rb_llama_state_get_size, 1);
@@ -5255,6 +4940,9 @@ void Init_llama_cpp(void) {
   /* TODO: llama_state_seq_set_data */
   /* TODO: llama_state_seq_save_file */
   /* TODO: llama_state_seq_load_file */
+  rb_define_module_function(rb_mLlamaCpp, "llama_state_seq_get_size_ext", rb_llama_state_seq_get_size_ext, 3);
+  /* TODO: llama_state_seq_get_data_ext */
+  /* TODO: llama_state_seq_set_data_ext */
   /* llama_batch_get_one */
   rb_define_module_function(rb_mLlamaCpp, "llama_batch_get_one", rb_llama_batch_get_one, 1);

data/lib/llama_cpp/version.rb CHANGED Viewed

@@ -3,8 +3,8 @@
 # llama_cpp.rb provides Ruby bindings for the llama.cpp.
 module LlamaCpp
   # The version of llama_cpp.rb you install.
-  VERSION = '0.21.2'
+  VERSION = '0.22.1'
   # The supported version of llama.cpp.
-  LLAMA_CPP_VERSION = 'b6100'
+  LLAMA_CPP_VERSION = 'b6310'
 end

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: llama_cpp
 version: !ruby/object:Gem::Version
-  version: 0.21.2
+  version: 0.22.1
 platform: ruby
 authors:
 - yoshoku