red-candle 1.0.0.pre.1 → 1.0.0.pre.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 34ca4771af8508ace5ee8df5d5111a407c79fea307f9fbc2b72d9e46d6dd2099
4
- data.tar.gz: 39a316c2990f8766257e07c5ae8803ba852aebc5c93b14349548b1da82b6ae4a
3
+ metadata.gz: 375ffec5c2293170bdb0e78ffe2584c8a963968d3226b601d12ddcc040c256ec
4
+ data.tar.gz: ea2490c59eca2480728afb7169fc3a24f4270e63491648c1d09fd111707dcb7e
5
5
  SHA512:
6
- metadata.gz: 51fcc58936f25818485bacd5dfc86911ca1ecbc0a8b87f6fdcf2d015a91faccd6aeb889df33a931eae6d864984254ab4a81ab7050fb00caf14d090820cf4d86b
7
- data.tar.gz: f6e58cc4e723c12e3d290fcb45b1cab5923594bfd011be223ec327c65c7c91cb7d37f9330ed82eadd4b7eb3085ef0ba9b874a6b98c15221b21c60cd01de11418
6
+ metadata.gz: 9011c72cbe2a065917f26774862bb1f82489e6d5354376cb616df7cea18646ca60ccd5e68282f39b23f89eead196ab41ce70cdaaca224f97aef61914559f653f
7
+ data.tar.gz: 4a48101bdcffeecd1bc687dacc7eee7dc42ddbb417b05cce57b97abad83cefe90d965be5c0a8256b8f5c9ba90d80f1159c5392097558acf93a3095913a68a2ad
data/Gemfile ADDED
@@ -0,0 +1,12 @@
1
+ source "https://rubygems.org"
2
+
3
+ gemspec
4
+
5
+ gem "minitest"
6
+ gem "rake"
7
+ gem "rake-compiler"
8
+
9
+ gem "yard", require: false
10
+ gem "yard-rustdoc", require: false
11
+
12
+ gem "redcarpet", "~> 3.6"
data/LICENSE ADDED
@@ -0,0 +1,22 @@
1
+ MIT License
2
+
3
+ Copyright (c) 2023 kojix2
4
+ Copyright (c) 2024 Christopher Petersen
5
+
6
+ Permission is hereby granted, free of charge, to any person obtaining a copy
7
+ of this software and associated documentation files (the "Software"), to deal
8
+ in the Software without restriction, including without limitation the rights
9
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10
+ copies of the Software, and to permit persons to whom the Software is
11
+ furnished to do so, subject to the following conditions:
12
+
13
+ The above copyright notice and this permission notice shall be included in all
14
+ copies or substantial portions of the Software.
15
+
16
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22
+ SOFTWARE.
data/Rakefile ADDED
@@ -0,0 +1,95 @@
1
+ # frozen_string_literal: true
2
+
3
+ require "bundler/gem_tasks"
4
+ require "rake/testtask"
5
+ require "rake/extensiontask"
6
+
7
+ ENV['CANDLE_TEST_SKIP_LLM'] = 'true'
8
+
9
+ task default: :test
10
+ Rake::TestTask.new do |t|
11
+ t.deps << :compile
12
+ t.libs << "test"
13
+ t.test_files = FileList["test/**/*_test.rb"]
14
+ end
15
+
16
+ spec = Bundler.load_gemspec("candle.gemspec")
17
+ Rake::ExtensionTask.new("candle", spec) do |c|
18
+ c.lib_dir = "lib/candle"
19
+ c.cross_compile = true
20
+ c.cross_platform = %w[
21
+ aarch64-linux
22
+ arm64-darwin
23
+ x64-mingw-ucrt
24
+ x64-mingw32
25
+ x86_64-darwin
26
+ x86_64-linux
27
+ x86_64-linux-musl
28
+ ]
29
+ end
30
+
31
+ desc "Run device compatibility tests"
32
+ Rake::TestTask.new("test:device") do |t|
33
+ t.deps << :compile
34
+ t.libs << "test"
35
+ t.test_files = FileList["test/device_compatibility_test.rb"]
36
+ t.verbose = true
37
+ end
38
+
39
+ desc "Run benchmark tests"
40
+ Rake::TestTask.new("test:benchmark") do |t|
41
+ ENV['CANDLE_RUN_BENCHMARKS'] = 'true'
42
+ t.deps << :compile
43
+ t.libs << "test"
44
+ t.test_files = FileList["test/benchmarks/**/*_test.rb"]
45
+ t.verbose = true
46
+ end
47
+
48
+ desc "Run all tests including benchmarks"
49
+ task "test:all" => [:test, "test:benchmark"]
50
+
51
+ desc "Run tests on specific devices"
52
+ namespace :test do
53
+ %w[cpu metal cuda].each do |device|
54
+ desc "Run tests on #{device.upcase} only"
55
+ task "device:#{device}" => :compile do
56
+ ENV['CANDLE_TEST_DEVICES'] = device
57
+ Rake::Task["test:device"].invoke
58
+ end
59
+ end
60
+ end
61
+
62
+ desc "Run benchmarks with device tests"
63
+ task "test:device:benchmark" => :compile do
64
+ ENV['CANDLE_RUN_BENCHMARKS'] = 'true'
65
+ ENV['CANDLE_TEST_VERBOSE'] = 'true'
66
+ Rake::Task["test:device"].invoke
67
+ Rake::Task["test:benchmark"].invoke
68
+ end
69
+
70
+ namespace :doc do
71
+ task default: %i[rustdoc yard]
72
+
73
+ desc "Generate YARD documentation"
74
+ task :yard do
75
+ sh <<~CMD
76
+ yard doc \
77
+ --plugin rustdoc -- lib tmp/doc/candle.json
78
+ CMD
79
+ end
80
+
81
+ desc "Generate Rust documentation as JSON"
82
+ task :rustdoc do
83
+ sh <<~CMD
84
+ cargo +nightly rustdoc \
85
+ --target-dir tmp/doc/target \
86
+ -p candle \
87
+ -- -Zunstable-options --output-format json \
88
+ --document-private-items
89
+ CMD
90
+
91
+ cp "tmp/doc/target/doc/candle.json", "tmp/doc/candle.json"
92
+ end
93
+ end
94
+
95
+ task doc: "doc:default"
data/bin/console ADDED
@@ -0,0 +1,11 @@
1
+ #!/usr/bin/env ruby
2
+ # frozen_string_literal: true
3
+
4
+ require "bundler/setup"
5
+ require "candle"
6
+
7
+ # You can add fixtures and/or initialization code here to make experimenting
8
+ # with your gem easier. You can also use a different console, if you like.
9
+
10
+ require "irb"
11
+ IRB.start(__FILE__)
data/bin/setup ADDED
@@ -0,0 +1,17 @@
1
+ #!/usr/bin/env bash
2
+ set -euo pipefail
3
+ IFS=$'\n\t'
4
+ set -vx
5
+
6
+ # Check if Rust is installed
7
+ if ! command -v cargo &> /dev/null
8
+ then
9
+ echo "Rust is not installed. Please install Rust: https://www.rust-lang.org/tools/install"
10
+ exit 1
11
+ fi
12
+
13
+ # Install Ruby dependencies
14
+ bundle install
15
+
16
+ # Build Rust extension
17
+ bundle exec rake compile
@@ -0,0 +1,63 @@
1
+ max_width = 100
2
+ hard_tabs = false
3
+ tab_spaces = 4
4
+ newline_style = "Auto"
5
+ use_small_heuristics = "Default"
6
+ indent_style = "Block"
7
+ wrap_comments = false
8
+ format_code_in_doc_comments = false
9
+ comment_width = 80
10
+ normalize_comments = false
11
+ normalize_doc_attributes = false
12
+ format_strings = false
13
+ format_macro_matchers = false
14
+ format_macro_bodies = true
15
+ empty_item_single_line = true
16
+ struct_lit_single_line = true
17
+ fn_single_line = false
18
+ where_single_line = false
19
+ imports_indent = "Block"
20
+ imports_layout = "Mixed"
21
+ imports_granularity="Crate"
22
+ reorder_imports = true
23
+ reorder_modules = true
24
+ reorder_impl_items = false
25
+ type_punctuation_density = "Wide"
26
+ space_before_colon = false
27
+ space_after_colon = true
28
+ spaces_around_ranges = false
29
+ binop_separator = "Front"
30
+ remove_nested_parens = true
31
+ combine_control_expr = true
32
+ overflow_delimited_expr = false
33
+ struct_field_align_threshold = 0
34
+ enum_discrim_align_threshold = 0
35
+ match_arm_blocks = true
36
+ force_multiline_blocks = false
37
+ fn_params_layout = "Tall"
38
+ brace_style = "SameLineWhere"
39
+ control_brace_style = "AlwaysSameLine"
40
+ trailing_semicolon = true
41
+ trailing_comma = "Vertical"
42
+ match_block_trailing_comma = false
43
+ blank_lines_upper_bound = 1
44
+ blank_lines_lower_bound = 0
45
+ edition = "2021"
46
+ version = "One"
47
+ inline_attribute_width = 0
48
+ merge_derives = true
49
+ use_try_shorthand = false
50
+ use_field_init_shorthand = false
51
+ force_explicit_abi = true
52
+ condense_wildcard_suffixes = false
53
+ color = "Auto"
54
+ #required_version = "1.4.12"
55
+ unstable_features = false
56
+ disable_all_formatting = false
57
+ skip_children = false
58
+ hide_parse_errors = false
59
+ error_on_line_overflow = false
60
+ error_on_unformatted = false
61
+ ignore = []
62
+ emit_mode = "Files"
63
+ make_backup = false
@@ -1,7 +1,7 @@
1
- use magnus::{function, method, prelude::*, Ruby};
1
+ use magnus::{function, prelude::*, Ruby};
2
2
 
3
3
  use crate::ruby::candle_utils;
4
- use crate::ruby::{DType, Device, QTensor, Result as RbResult, Tensor};
4
+ use crate::ruby::Result as RbResult;
5
5
 
6
6
  pub mod llm;
7
7
  pub mod reranker;
@@ -42,101 +42,11 @@ fn init(ruby: &Ruby) -> RbResult<()> {
42
42
  ruby::init_embedding_model(rb_candle)?;
43
43
  ruby::init_llm(rb_candle)?;
44
44
  reranker::init(rb_candle)?;
45
+ ruby::dtype::init(rb_candle)?;
46
+ ruby::qtensor::init(rb_candle)?;
47
+ ruby::device::init(rb_candle)?;
48
+ ruby::tensor::init(rb_candle)?;
45
49
  candle_utils(rb_candle)?;
46
- let rb_tensor = rb_candle.define_class("Tensor", Ruby::class_object(ruby))?;
47
- rb_tensor.define_singleton_method("new", function!(Tensor::new, 3))?;
48
- // rb_tensor.define_singleton_method("cat", function!(Tensor::cat, 2))?;
49
- // rb_tensor.define_singleton_method("stack", function!(Tensor::stack, 2))?;
50
- rb_tensor.define_singleton_method("rand", function!(Tensor::rand, 2))?;
51
- rb_tensor.define_singleton_method("randn", function!(Tensor::randn, 2))?;
52
- rb_tensor.define_singleton_method("ones", function!(Tensor::ones, 2))?;
53
- rb_tensor.define_singleton_method("zeros", function!(Tensor::zeros, 2))?;
54
- rb_tensor.define_method("values", method!(Tensor::values, 0))?;
55
- rb_tensor.define_method("values_f32", method!(Tensor::values_f32, 0))?;
56
- rb_tensor.define_method("item", method!(Tensor::item, 0))?;
57
- rb_tensor.define_method("shape", method!(Tensor::shape, 0))?;
58
- rb_tensor.define_method("stride", method!(Tensor::stride, 0))?;
59
- rb_tensor.define_method("dtype", method!(Tensor::dtype, 0))?;
60
- rb_tensor.define_method("device", method!(Tensor::device, 0))?;
61
- rb_tensor.define_method("rank", method!(Tensor::rank, 0))?;
62
- rb_tensor.define_method("elem_count", method!(Tensor::elem_count, 0))?;
63
- rb_tensor.define_method("sin", method!(Tensor::sin, 0))?;
64
- rb_tensor.define_method("cos", method!(Tensor::cos, 0))?;
65
- rb_tensor.define_method("log", method!(Tensor::log, 0))?;
66
- rb_tensor.define_method("sqr", method!(Tensor::sqr, 0))?;
67
- rb_tensor.define_method("mean", method!(Tensor::mean, 1))?;
68
- rb_tensor.define_method("sum", method!(Tensor::sum, 1))?;
69
- rb_tensor.define_method("sqrt", method!(Tensor::sqrt, 0))?;
70
- rb_tensor.define_method("/", method!(Tensor::__truediv__, 1))?; // Accepts Tensor, Float, or Integer
71
- rb_tensor.define_method("recip", method!(Tensor::recip, 0))?;
72
- rb_tensor.define_method("exp", method!(Tensor::exp, 0))?;
73
- rb_tensor.define_method("powf", method!(Tensor::powf, 1))?;
74
- rb_tensor.define_method("index_select", method!(Tensor::index_select, 2))?;
75
- rb_tensor.define_method("matmul", method!(Tensor::matmul, 1))?;
76
- rb_tensor.define_method("broadcast_add", method!(Tensor::broadcast_add, 1))?;
77
- rb_tensor.define_method("broadcast_sub", method!(Tensor::broadcast_sub, 1))?;
78
- rb_tensor.define_method("broadcast_mul", method!(Tensor::broadcast_mul, 1))?;
79
- rb_tensor.define_method("broadcast_div", method!(Tensor::broadcast_div, 1))?;
80
- rb_tensor.define_method("where_cond", method!(Tensor::where_cond, 2))?;
81
- rb_tensor.define_method("+", method!(Tensor::__add__, 1))?;
82
- rb_tensor.define_method("*", method!(Tensor::__mul__, 1))?;
83
- rb_tensor.define_method("-", method!(Tensor::__sub__, 1))?;
84
- rb_tensor.define_method("reshape", method!(Tensor::reshape, 1))?;
85
- rb_tensor.define_method("broadcast_as", method!(Tensor::broadcast_as, 1))?;
86
- rb_tensor.define_method("broadcast_left", method!(Tensor::broadcast_left, 1))?;
87
- rb_tensor.define_method("squeeze", method!(Tensor::squeeze, 1))?;
88
- rb_tensor.define_method("unsqueeze", method!(Tensor::unsqueeze, 1))?;
89
- rb_tensor.define_method("get", method!(Tensor::get, 1))?;
90
- rb_tensor.define_method("[]", method!(Tensor::get, 1))?;
91
- rb_tensor.define_method("transpose", method!(Tensor::transpose, 2))?;
92
- rb_tensor.define_method("narrow", method!(Tensor::narrow, 3))?;
93
- rb_tensor.define_method("argmax_keepdim", method!(Tensor::argmax_keepdim, 1))?;
94
- rb_tensor.define_method("argmin_keepdim", method!(Tensor::argmin_keepdim, 1))?;
95
- rb_tensor.define_method("max_keepdim", method!(Tensor::max_keepdim, 1))?;
96
- rb_tensor.define_method("min_keepdim", method!(Tensor::min_keepdim, 1))?;
97
- // rb_tensor.define_method("eq", method!(Tensor::eq, 1))?;
98
- // rb_tensor.define_method("ne", method!(Tensor::ne, 1))?;
99
- // rb_tensor.define_method("lt", method!(Tensor::lt, 1))?;
100
- // rb_tensor.define_method("gt", method!(Tensor::gt, 1))?;
101
- // rb_tensor.define_method("ge", method!(Tensor::ge, 1))?;
102
- // rb_tensor.define_method("le", method!(Tensor::le, 1))?;
103
- rb_tensor.define_method("sum_all", method!(Tensor::sum_all, 0))?;
104
- rb_tensor.define_method("mean_all", method!(Tensor::mean_all, 0))?;
105
- rb_tensor.define_method("flatten_from", method!(Tensor::flatten_from, 1))?;
106
- rb_tensor.define_method("flatten_to", method!(Tensor::flatten_to, 1))?;
107
- rb_tensor.define_method("flatten_all", method!(Tensor::flatten_all, 0))?;
108
- rb_tensor.define_method("t", method!(Tensor::t, 0))?;
109
- rb_tensor.define_method("contiguous", method!(Tensor::contiguous, 0))?;
110
- rb_tensor.define_method("is_contiguous", method!(Tensor::is_contiguous, 0))?;
111
- rb_tensor.define_method(
112
- "is_fortran_contiguous",
113
- method!(Tensor::is_fortran_contiguous, 0),
114
- )?;
115
- rb_tensor.define_method("detach", method!(Tensor::detach, 0))?;
116
- rb_tensor.define_method("copy", method!(Tensor::copy, 0))?;
117
- rb_tensor.define_method("to_dtype", method!(Tensor::to_dtype, 1))?;
118
- rb_tensor.define_method("to_device", method!(Tensor::to_device, 1))?;
119
- rb_tensor.define_method("to_s", method!(Tensor::__str__, 0))?;
120
- rb_tensor.define_method("inspect", method!(Tensor::__repr__, 0))?;
121
-
122
- let rb_dtype = rb_candle.define_class("DType", Ruby::class_object(ruby))?;
123
- rb_dtype.define_method("to_s", method!(DType::__str__, 0))?;
124
- rb_dtype.define_method("inspect", method!(DType::__repr__, 0))?;
125
-
126
- let rb_device = rb_candle.define_class("Device", Ruby::class_object(ruby))?;
127
- rb_device.define_singleton_method("cpu", function!(Device::cpu, 0))?;
128
- rb_device.define_singleton_method("cuda", function!(Device::cuda, 0))?;
129
- rb_device.define_singleton_method("metal", function!(Device::metal, 0))?;
130
- rb_device.define_singleton_method("available_devices", function!(ruby::device::available_devices, 0))?;
131
- rb_device.define_singleton_method("default", function!(ruby::device::default_device, 0))?;
132
- rb_device.define_method("to_s", method!(Device::__str__, 0))?;
133
- rb_device.define_method("inspect", method!(Device::__repr__, 0))?;
134
-
135
- let rb_qtensor = rb_candle.define_class("QTensor", Ruby::class_object(ruby))?;
136
- rb_qtensor.define_method("ggml_dtype", method!(QTensor::ggml_dtype, 0))?;
137
- rb_qtensor.define_method("rank", method!(QTensor::rank, 0))?;
138
- rb_qtensor.define_method("shape", method!(QTensor::shape, 0))?;
139
- rb_qtensor.define_method("dequantize", method!(QTensor::dequantize, 0))?;
140
50
 
141
51
  Ok(())
142
52
  }
@@ -0,0 +1,49 @@
1
+ use std::time::{SystemTime, UNIX_EPOCH};
2
+
3
+ /// Configuration for text generation
4
+ #[derive(Debug, Clone)]
5
+ pub struct GenerationConfig {
6
+ /// The maximum number of tokens to generate
7
+ pub max_length: usize,
8
+ /// The temperature for sampling
9
+ pub temperature: f64,
10
+ /// The top-p value for nucleus sampling
11
+ pub top_p: Option<f64>,
12
+ /// The top-k value for top-k sampling
13
+ pub top_k: Option<usize>,
14
+ /// The repetition penalty
15
+ pub repetition_penalty: f32,
16
+ /// The repetition penalty range
17
+ pub repetition_penalty_last_n: usize,
18
+ /// Random seed for sampling
19
+ pub seed: u64,
20
+ /// Stop sequences
21
+ pub stop_sequences: Vec<String>,
22
+ /// Whether to return the prompt in the output
23
+ pub include_prompt: bool,
24
+ }
25
+
26
+ /// Generate a random seed based on current time
27
+ fn random_seed() -> u64 {
28
+ SystemTime::now()
29
+ .duration_since(UNIX_EPOCH)
30
+ .map(|d| d.as_nanos() as u64)
31
+ .unwrap_or(42)
32
+ }
33
+
34
+ impl Default for GenerationConfig {
35
+ fn default() -> Self {
36
+ Self {
37
+ max_length: 512,
38
+ temperature: 0.7,
39
+ top_p: None,
40
+ top_k: None,
41
+ repetition_penalty: 1.1,
42
+ repetition_penalty_last_n: 64,
43
+ seed: random_seed(),
44
+ stop_sequences: vec![],
45
+ include_prompt: false,
46
+ }
47
+ }
48
+ }
49
+