llama_cpp 0.10.1 → 0.10.2
- checksums.yaml +4 -4
- data/CHANGELOG.md +6 -0
- data/ext/llama_cpp/llama_cpp.cpp +16 -1
- data/ext/llama_cpp/src/ggml-alloc.c +12 -4
- data/ext/llama_cpp/src/ggml-backend-impl.h +12 -8
- data/ext/llama_cpp/src/ggml-backend.c +75 -5
- data/ext/llama_cpp/src/ggml-backend.h +7 -0
- data/ext/llama_cpp/src/ggml-cuda.cu +284 -162
- data/ext/llama_cpp/src/ggml-metal.h +3 -0
- data/ext/llama_cpp/src/ggml-metal.m +190 -44
- data/ext/llama_cpp/src/ggml-metal.metal +11 -2
- data/ext/llama_cpp/src/ggml.c +262 -89
- data/ext/llama_cpp/src/ggml.h +24 -10
- data/ext/llama_cpp/src/llama.cpp +926 -780
- data/ext/llama_cpp/src/llama.h +8 -3
- data/lib/llama_cpp/version.rb +2 -2
- metadata +2 -2
data/ext/llama_cpp/src/llama.h
CHANGED
@@ -39,6 +39,7 @@
 
 #define LLAMA_MAX_RNG_STATE (64*1024)
 
+#define LLAMA_FILE_MAGIC_GGLA 0x67676c61u // 'ggla'
 #define LLAMA_FILE_MAGIC_GGSN 0x6767736eu // 'ggsn'
 
 #define LLAMA_SESSION_MAGIC LLAMA_FILE_MAGIC_GGSN
@@ -126,7 +127,7 @@ extern "C" {
         bool sorted;
     } llama_token_data_array;
 
-    typedef void (*llama_progress_callback)(float progress, void *ctx);
+    typedef bool (*llama_progress_callback)(float progress, void *ctx);
 
     // Input data for llama_decode
     // A llama_batch object can contain input about one or many sequences
@@ -179,7 +180,9 @@ extern "C" {
         int32_t main_gpu;           // the GPU that is used for scratch and small tensors
         const float * tensor_split; // how to split layers across multiple GPUs (size: LLAMA_MAX_DEVICES)
 
-        // called with a progress value between 0 and 1, pass NULL to disable
+        // Called with a progress value between 0.0 and 1.0. Pass NULL to disable.
+        // If the provided progress_callback returns true, model loading continues.
+        // If it returns false, model loading is immediately aborted.
         llama_progress_callback progress_callback;
 
         // context pointer passed to the progress callback
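
With the bool-returning callback, user code can now cancel a model load partway through. Below is a minimal C sketch against the bundled llama.cpp b1686 API (not part of this gem's diff); the model path and the 0.5 abort threshold are placeholder values:

```c
#include <stdbool.h>
#include <stdio.h>
#include "llama.h"

// Abort loading once progress exceeds the limit passed via user_data.
static bool my_progress(float progress, void * user_data) {
    const float limit = *(const float *) user_data;
    fprintf(stderr, "loading: %3.0f%%\n", progress * 100.0f);
    return progress <= limit; // returning false aborts llama_load_model_from_file
}

int main(void) {
    llama_backend_init(false);

    float limit = 0.5f; // placeholder: cancel the load at roughly 50%
    struct llama_model_params mparams   = llama_model_default_params();
    mparams.progress_callback           = my_progress;
    mparams.progress_callback_user_data = &limit;

    // "model.gguf" is a placeholder path.
    struct llama_model * model = llama_load_model_from_file("model.gguf", mparams);
    if (model == NULL) {
        fprintf(stderr, "model loading failed or was aborted\n");
        llama_backend_free();
        return 1;
    }

    llama_free_model(model);
    llama_backend_free();
    return 0;
}
```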
@@ -313,7 +316,9 @@ extern "C" {
 
     LLAMA_API const struct llama_model * llama_get_model(const struct llama_context * ctx);
 
-    LLAMA_API int llama_n_ctx      (const struct llama_context * ctx);
+    // TODO: become more consistent with returned int types across the API
+    LLAMA_API uint32_t llama_n_ctx    (const struct llama_context * ctx);
+    LLAMA_API uint32_t llama_n_batch  (const struct llama_context * ctx);
 
     LLAMA_API enum llama_vocab_type llama_vocab_type(const struct llama_model * model);
 
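
The new getters read the context and batch sizes back from an existing llama_context. A minimal C sketch under the same assumptions (placeholder model path; the sizes are arbitrary examples):

```c
#include <stdio.h>
#include "llama.h"

int main(void) {
    llama_backend_init(false);

    struct llama_model * model = llama_load_model_from_file("model.gguf", llama_model_default_params());
    if (model == NULL) {
        llama_backend_free();
        return 1;
    }

    struct llama_context_params cparams = llama_context_default_params();
    cparams.n_ctx   = 2048; // example values
    cparams.n_batch = 512;

    struct llama_context * ctx = llama_new_context_with_model(model, cparams);
    if (ctx == NULL) {
        llama_free_model(model);
        llama_backend_free();
        return 1;
    }

    // Both getters now return uint32_t (previously llama_n_ctx returned int).
    printf("n_ctx = %u, n_batch = %u\n", llama_n_ctx(ctx), llama_n_batch(ctx));

    llama_free(ctx);
    llama_free_model(model);
    llama_backend_free();
    return 0;
}
```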
data/lib/llama_cpp/version.rb
CHANGED
@@ -3,8 +3,8 @@
 # llama_cpp.rb provides Ruby bindings for the llama.cpp.
 module LLaMACpp
   # The version of llama_cpp.rb you install.
-  VERSION = '0.10.1'
+  VERSION = '0.10.2'
 
   # The version of llama.cpp bundled with llama_cpp.rb.
-  LLAMA_CPP_VERSION = '
+  LLAMA_CPP_VERSION = 'b1686'
 end
metadata
CHANGED
@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: llama_cpp
 version: !ruby/object:Gem::Version
-  version: 0.10.1
+  version: 0.10.2
 platform: ruby
 authors:
 - yoshoku
 autorequire:
 bindir: exe
 cert_chain: []
-date: 2023-12-
+date: 2023-12-23 00:00:00.000000000 Z
 dependencies: []
 description: llama_cpp.rb provides Ruby bindings for the llama.cpp.
 email: