kreuzberg 4.0.0.pre.rc.6 → 4.0.0.rc1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (175) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +0 -6
  3. data/.rubocop.yaml +534 -1
  4. data/Gemfile +2 -1
  5. data/Gemfile.lock +11 -11
  6. data/README.md +5 -10
  7. data/examples/async_patterns.rb +0 -1
  8. data/ext/kreuzberg_rb/extconf.rb +0 -10
  9. data/ext/kreuzberg_rb/native/Cargo.toml +15 -23
  10. data/ext/kreuzberg_rb/native/build.rs +2 -0
  11. data/ext/kreuzberg_rb/native/include/ieeefp.h +1 -1
  12. data/ext/kreuzberg_rb/native/include/msvc_compat/strings.h +1 -1
  13. data/ext/kreuzberg_rb/native/include/strings.h +2 -2
  14. data/ext/kreuzberg_rb/native/include/unistd.h +1 -1
  15. data/ext/kreuzberg_rb/native/src/lib.rs +16 -75
  16. data/kreuzberg.gemspec +14 -57
  17. data/lib/kreuzberg/cache_api.rb +0 -1
  18. data/lib/kreuzberg/cli.rb +2 -2
  19. data/lib/kreuzberg/config.rb +2 -9
  20. data/lib/kreuzberg/errors.rb +7 -75
  21. data/lib/kreuzberg/extraction_api.rb +0 -1
  22. data/lib/kreuzberg/setup_lib_path.rb +0 -1
  23. data/lib/kreuzberg/version.rb +1 -1
  24. data/lib/kreuzberg.rb +0 -21
  25. data/pkg/kreuzberg-4.0.0.rc1.gem +0 -0
  26. data/sig/kreuzberg.rbs +3 -55
  27. data/spec/binding/cli_proxy_spec.rb +4 -2
  28. data/spec/binding/cli_spec.rb +11 -12
  29. data/spec/examples.txt +104 -0
  30. data/spec/fixtures/config.yaml +1 -0
  31. data/spec/spec_helper.rb +1 -1
  32. data/vendor/kreuzberg/Cargo.toml +42 -112
  33. data/vendor/kreuzberg/README.md +2 -2
  34. data/vendor/kreuzberg/build.rs +4 -18
  35. data/vendor/kreuzberg/src/bin/profile_extract.rs +455 -0
  36. data/vendor/kreuzberg/src/cache/mod.rs +3 -27
  37. data/vendor/kreuzberg/src/core/batch_mode.rs +0 -60
  38. data/vendor/kreuzberg/src/core/extractor.rs +81 -202
  39. data/vendor/kreuzberg/src/core/io.rs +2 -4
  40. data/vendor/kreuzberg/src/core/mime.rs +12 -2
  41. data/vendor/kreuzberg/src/core/mod.rs +1 -4
  42. data/vendor/kreuzberg/src/core/pipeline.rs +33 -111
  43. data/vendor/kreuzberg/src/embeddings.rs +16 -125
  44. data/vendor/kreuzberg/src/error.rs +1 -1
  45. data/vendor/kreuzberg/src/extraction/docx.rs +1 -1
  46. data/vendor/kreuzberg/src/extraction/image.rs +13 -13
  47. data/vendor/kreuzberg/src/extraction/libreoffice.rs +1 -0
  48. data/vendor/kreuzberg/src/extraction/mod.rs +5 -9
  49. data/vendor/kreuzberg/src/extraction/office_metadata/mod.rs +0 -2
  50. data/vendor/kreuzberg/src/extraction/pandoc/batch.rs +275 -0
  51. data/vendor/kreuzberg/src/extraction/pandoc/mime_types.rs +178 -0
  52. data/vendor/kreuzberg/src/extraction/pandoc/mod.rs +491 -0
  53. data/vendor/kreuzberg/src/extraction/pandoc/server.rs +496 -0
  54. data/vendor/kreuzberg/src/extraction/pandoc/subprocess.rs +1188 -0
  55. data/vendor/kreuzberg/src/extraction/pandoc/version.rs +162 -0
  56. data/vendor/kreuzberg/src/extractors/archive.rs +0 -21
  57. data/vendor/kreuzberg/src/extractors/docx.rs +128 -16
  58. data/vendor/kreuzberg/src/extractors/email.rs +0 -14
  59. data/vendor/kreuzberg/src/extractors/excel.rs +20 -19
  60. data/vendor/kreuzberg/src/extractors/html.rs +154 -137
  61. data/vendor/kreuzberg/src/extractors/image.rs +4 -7
  62. data/vendor/kreuzberg/src/extractors/mod.rs +9 -106
  63. data/vendor/kreuzberg/src/extractors/pandoc.rs +201 -0
  64. data/vendor/kreuzberg/src/extractors/pdf.rs +15 -12
  65. data/vendor/kreuzberg/src/extractors/pptx.rs +3 -17
  66. data/vendor/kreuzberg/src/extractors/structured.rs +0 -14
  67. data/vendor/kreuzberg/src/extractors/text.rs +5 -23
  68. data/vendor/kreuzberg/src/extractors/xml.rs +0 -7
  69. data/vendor/kreuzberg/src/keywords/rake.rs +1 -0
  70. data/vendor/kreuzberg/src/lib.rs +1 -4
  71. data/vendor/kreuzberg/src/mcp/mod.rs +1 -1
  72. data/vendor/kreuzberg/src/mcp/server.rs +3 -5
  73. data/vendor/kreuzberg/src/ocr/processor.rs +2 -18
  74. data/vendor/kreuzberg/src/pdf/error.rs +1 -1
  75. data/vendor/kreuzberg/src/pdf/table.rs +44 -17
  76. data/vendor/kreuzberg/src/pdf/text.rs +3 -0
  77. data/vendor/kreuzberg/src/plugins/extractor.rs +5 -8
  78. data/vendor/kreuzberg/src/plugins/ocr.rs +11 -2
  79. data/vendor/kreuzberg/src/plugins/processor.rs +1 -2
  80. data/vendor/kreuzberg/src/plugins/registry.rs +0 -13
  81. data/vendor/kreuzberg/src/plugins/validator.rs +8 -9
  82. data/vendor/kreuzberg/src/stopwords/mod.rs +2 -2
  83. data/vendor/kreuzberg/src/types.rs +12 -42
  84. data/vendor/kreuzberg/tests/batch_orchestration.rs +5 -19
  85. data/vendor/kreuzberg/tests/batch_processing.rs +3 -15
  86. data/vendor/kreuzberg/tests/chunking_offset_demo.rs +92 -0
  87. data/vendor/kreuzberg/tests/concurrency_stress.rs +1 -17
  88. data/vendor/kreuzberg/tests/config_features.rs +0 -18
  89. data/vendor/kreuzberg/tests/config_loading_tests.rs +39 -15
  90. data/vendor/kreuzberg/tests/core_integration.rs +7 -24
  91. data/vendor/kreuzberg/tests/csv_integration.rs +81 -71
  92. data/vendor/kreuzberg/tests/docx_metadata_extraction_test.rs +25 -23
  93. data/vendor/kreuzberg/tests/pandoc_integration.rs +503 -0
  94. data/vendor/kreuzberg/tests/pipeline_integration.rs +1 -0
  95. data/vendor/kreuzberg/tests/plugin_postprocessor_test.rs +1 -0
  96. data/vendor/kreuzberg/tests/registry_integration_tests.rs +22 -1
  97. data/vendor/kreuzberg/tests/security_validation.rs +1 -12
  98. metadata +25 -90
  99. data/.rubocop.yml +0 -538
  100. data/ext/kreuzberg_rb/native/Cargo.lock +0 -6535
  101. data/lib/kreuzberg/error_context.rb +0 -32
  102. data/vendor/kreuzberg/benches/otel_overhead.rs +0 -48
  103. data/vendor/kreuzberg/src/extraction/markdown.rs +0 -213
  104. data/vendor/kreuzberg/src/extraction/office_metadata/odt_properties.rs +0 -287
  105. data/vendor/kreuzberg/src/extractors/bibtex.rs +0 -469
  106. data/vendor/kreuzberg/src/extractors/docbook.rs +0 -502
  107. data/vendor/kreuzberg/src/extractors/epub.rs +0 -707
  108. data/vendor/kreuzberg/src/extractors/fictionbook.rs +0 -491
  109. data/vendor/kreuzberg/src/extractors/fictionbook.rs.backup2 +0 -738
  110. data/vendor/kreuzberg/src/extractors/jats.rs +0 -1051
  111. data/vendor/kreuzberg/src/extractors/jupyter.rs +0 -367
  112. data/vendor/kreuzberg/src/extractors/latex.rs +0 -652
  113. data/vendor/kreuzberg/src/extractors/markdown.rs +0 -700
  114. data/vendor/kreuzberg/src/extractors/odt.rs +0 -628
  115. data/vendor/kreuzberg/src/extractors/opml.rs +0 -634
  116. data/vendor/kreuzberg/src/extractors/orgmode.rs +0 -528
  117. data/vendor/kreuzberg/src/extractors/rst.rs +0 -576
  118. data/vendor/kreuzberg/src/extractors/rtf.rs +0 -810
  119. data/vendor/kreuzberg/src/extractors/security.rs +0 -484
  120. data/vendor/kreuzberg/src/extractors/security_tests.rs +0 -367
  121. data/vendor/kreuzberg/src/extractors/typst.rs +0 -650
  122. data/vendor/kreuzberg/src/panic_context.rs +0 -154
  123. data/vendor/kreuzberg/tests/api_extract_multipart.rs +0 -52
  124. data/vendor/kreuzberg/tests/bibtex_parity_test.rs +0 -421
  125. data/vendor/kreuzberg/tests/docbook_extractor_tests.rs +0 -498
  126. data/vendor/kreuzberg/tests/docx_vs_pandoc_comparison.rs +0 -370
  127. data/vendor/kreuzberg/tests/epub_native_extractor_tests.rs +0 -275
  128. data/vendor/kreuzberg/tests/fictionbook_extractor_tests.rs +0 -228
  129. data/vendor/kreuzberg/tests/html_table_test.rs +0 -551
  130. data/vendor/kreuzberg/tests/instrumentation_test.rs +0 -139
  131. data/vendor/kreuzberg/tests/jats_extractor_tests.rs +0 -639
  132. data/vendor/kreuzberg/tests/jupyter_extractor_tests.rs +0 -704
  133. data/vendor/kreuzberg/tests/latex_extractor_tests.rs +0 -496
  134. data/vendor/kreuzberg/tests/markdown_extractor_tests.rs +0 -490
  135. data/vendor/kreuzberg/tests/odt_extractor_tests.rs +0 -695
  136. data/vendor/kreuzberg/tests/opml_extractor_tests.rs +0 -616
  137. data/vendor/kreuzberg/tests/orgmode_extractor_tests.rs +0 -822
  138. data/vendor/kreuzberg/tests/rst_extractor_tests.rs +0 -692
  139. data/vendor/kreuzberg/tests/rtf_extractor_tests.rs +0 -776
  140. data/vendor/kreuzberg/tests/typst_behavioral_tests.rs +0 -1259
  141. data/vendor/kreuzberg/tests/typst_extractor_tests.rs +0 -647
  142. data/vendor/rb-sys/.cargo-ok +0 -1
  143. data/vendor/rb-sys/.cargo_vcs_info.json +0 -6
  144. data/vendor/rb-sys/Cargo.lock +0 -393
  145. data/vendor/rb-sys/Cargo.toml +0 -70
  146. data/vendor/rb-sys/Cargo.toml.orig +0 -57
  147. data/vendor/rb-sys/LICENSE-APACHE +0 -190
  148. data/vendor/rb-sys/LICENSE-MIT +0 -21
  149. data/vendor/rb-sys/bin/release.sh +0 -21
  150. data/vendor/rb-sys/build/features.rs +0 -108
  151. data/vendor/rb-sys/build/main.rs +0 -246
  152. data/vendor/rb-sys/build/stable_api_config.rs +0 -153
  153. data/vendor/rb-sys/build/version.rs +0 -48
  154. data/vendor/rb-sys/readme.md +0 -36
  155. data/vendor/rb-sys/src/bindings.rs +0 -21
  156. data/vendor/rb-sys/src/hidden.rs +0 -11
  157. data/vendor/rb-sys/src/lib.rs +0 -34
  158. data/vendor/rb-sys/src/macros.rs +0 -371
  159. data/vendor/rb-sys/src/memory.rs +0 -53
  160. data/vendor/rb-sys/src/ruby_abi_version.rs +0 -38
  161. data/vendor/rb-sys/src/special_consts.rs +0 -31
  162. data/vendor/rb-sys/src/stable_api/compiled.c +0 -179
  163. data/vendor/rb-sys/src/stable_api/compiled.rs +0 -257
  164. data/vendor/rb-sys/src/stable_api/ruby_2_6.rs +0 -316
  165. data/vendor/rb-sys/src/stable_api/ruby_2_7.rs +0 -316
  166. data/vendor/rb-sys/src/stable_api/ruby_3_0.rs +0 -324
  167. data/vendor/rb-sys/src/stable_api/ruby_3_1.rs +0 -317
  168. data/vendor/rb-sys/src/stable_api/ruby_3_2.rs +0 -315
  169. data/vendor/rb-sys/src/stable_api/ruby_3_3.rs +0 -326
  170. data/vendor/rb-sys/src/stable_api/ruby_3_4.rs +0 -327
  171. data/vendor/rb-sys/src/stable_api.rs +0 -261
  172. data/vendor/rb-sys/src/symbol.rs +0 -31
  173. data/vendor/rb-sys/src/tracking_allocator.rs +0 -332
  174. data/vendor/rb-sys/src/utils.rs +0 -89
  175. data/vendor/rb-sys/src/value_type.rs +0 -7
@@ -1,316 +0,0 @@
1
- use super::StableApiDefinition;
2
-
3
- use crate::ruby_rarray_flags::*;
4
- use crate::ruby_rstring_flags::*;
5
- use crate::{
6
- VALUE, debug_ruby_assert_type,
7
- internal::{RArray, RString, RTypedData},
8
- ruby_value_type::RUBY_T_DATA,
9
- value_type,
10
- };
11
- use std::{
12
- ffi::c_void,
13
- os::raw::{c_char, c_long},
14
- ptr::NonNull,
15
- time::Duration,
16
- };
17
-
18
- #[cfg(not(ruby_eq_2_6))]
19
- compile_error!("This file should only be included in Ruby 2.6 builds");
20
-
21
- pub struct Definition;
22
-
23
- impl StableApiDefinition for Definition {
24
- const VERSION_MAJOR: u32 = 2;
25
- const VERSION_MINOR: u32 = 6;
26
-
27
- #[inline]
28
- unsafe fn rstring_len(&self, obj: VALUE) -> c_long {
29
- assert!(self.type_p(obj, crate::ruby_value_type::RUBY_T_STRING));
30
- let rstring: &RString = &*(obj as *const RString);
31
- let flags = rstring.basic.flags;
32
- let is_heap = (flags & RSTRING_NOEMBED as VALUE) != 0;
33
-
34
- if !is_heap {
35
- let mut f = rstring.basic.flags;
36
- f &= RSTRING_EMBED_LEN_MASK as VALUE;
37
- f >>= RSTRING_EMBED_LEN_SHIFT as VALUE;
38
- f as c_long
39
- } else {
40
- rstring.as_.heap.len
41
- }
42
- }
43
-
44
- #[inline]
45
- unsafe fn rstring_ptr(&self, obj: VALUE) -> *const c_char {
46
- assert!(self.type_p(obj, crate::ruby_value_type::RUBY_T_STRING));
47
-
48
- let rstring: &RString = &*(obj as *const RString);
49
- let flags = rstring.basic.flags;
50
- let is_heap = (flags & RSTRING_NOEMBED as VALUE) != 0;
51
- let ptr = if !is_heap {
52
- std::ptr::addr_of!(rstring.as_.ary) as *const _
53
- } else {
54
- rstring.as_.heap.ptr
55
- };
56
-
57
- assert!(!ptr.is_null());
58
-
59
- ptr
60
- }
61
-
62
- #[inline]
63
- unsafe fn rarray_len(&self, obj: VALUE) -> c_long {
64
- assert!(self.type_p(obj, value_type::RUBY_T_ARRAY));
65
-
66
- let rarray: &RArray = &*(obj as *const RArray);
67
- let flags = rarray.basic.flags;
68
- let is_embedded = (flags & RARRAY_EMBED_FLAG as VALUE) != 0;
69
-
70
- if is_embedded {
71
- let mut f = rarray.basic.flags;
72
- f &= RARRAY_EMBED_LEN_MASK as VALUE;
73
- f >>= RARRAY_EMBED_LEN_SHIFT as VALUE;
74
- f as c_long
75
- } else {
76
- rarray.as_.heap.len
77
- }
78
- }
79
-
80
- #[inline]
81
- unsafe fn rarray_const_ptr(&self, obj: VALUE) -> *const VALUE {
82
- assert!(self.type_p(obj, value_type::RUBY_T_ARRAY));
83
-
84
- let rarray: &RArray = &*(obj as *const RArray);
85
- let flags = rarray.basic.flags;
86
- let is_embedded = (flags & RARRAY_EMBED_FLAG as VALUE) != 0;
87
- let ptr = if is_embedded {
88
- rarray.as_.ary.as_ptr()
89
- } else {
90
- rarray.as_.heap.ptr
91
- };
92
-
93
- assert!(!ptr.is_null());
94
-
95
- ptr
96
- }
97
-
98
- #[inline]
99
- unsafe fn rbasic_class(&self, obj: VALUE) -> Option<NonNull<VALUE>> {
100
- let rbasic = obj as *const crate::RBasic;
101
-
102
- NonNull::<VALUE>::new((*rbasic).klass as _)
103
- }
104
-
105
- #[inline]
106
- unsafe fn frozen_p(&self, obj: VALUE) -> bool {
107
- if self.special_const_p(obj) {
108
- true
109
- } else {
110
- let rbasic = obj as *const crate::RBasic;
111
- ((*rbasic).flags & crate::ruby_fl_type::RUBY_FL_FREEZE as VALUE) != 0
112
- }
113
- }
114
-
115
- #[inline]
116
- unsafe fn bignum_positive_p(&self, obj: VALUE) -> bool {
117
- let rbasic = obj as *const crate::RBasic;
118
-
119
- ((*rbasic).flags & crate::ruby_fl_type::RUBY_FL_USER1 as VALUE) != 0
120
- }
121
-
122
- #[inline]
123
- fn special_const_p(&self, value: VALUE) -> bool {
124
- let is_immediate = value & (crate::special_consts::IMMEDIATE_MASK as VALUE) != 0;
125
- let test = (value & !(crate::Qnil as VALUE)) != 0;
126
-
127
- is_immediate || !test
128
- }
129
-
130
- #[inline]
131
- unsafe fn builtin_type(&self, obj: VALUE) -> crate::ruby_value_type {
132
- let rbasic = obj as *const crate::RBasic;
133
- let ret: u32 = ((*rbasic).flags & crate::ruby_value_type::RUBY_T_MASK as VALUE) as _;
134
-
135
- std::mem::transmute::<_, crate::ruby_value_type>(ret)
136
- }
137
-
138
- #[inline]
139
- fn nil_p(&self, obj: VALUE) -> bool {
140
- obj == (crate::Qnil as VALUE)
141
- }
142
-
143
- #[inline]
144
- fn fixnum_p(&self, obj: VALUE) -> bool {
145
- (obj & crate::FIXNUM_FLAG as VALUE) != 0
146
- }
147
-
148
- #[inline]
149
- fn static_sym_p(&self, obj: VALUE) -> bool {
150
- let mask = !(VALUE::MAX << crate::ruby_special_consts::RUBY_SPECIAL_SHIFT as VALUE);
151
- (obj & mask) == crate::ruby_special_consts::RUBY_SYMBOL_FLAG as VALUE
152
- }
153
-
154
- #[inline]
155
- fn flonum_p(&self, obj: VALUE) -> bool {
156
- #[cfg(ruby_use_flonum = "true")]
157
- let ret = (obj & crate::FLONUM_MASK as VALUE) == crate::FLONUM_FLAG as VALUE;
158
-
159
- #[cfg(not(ruby_use_flonum = "true"))]
160
- let ret = false;
161
-
162
- ret
163
- }
164
-
165
- #[inline]
166
- fn immediate_p(&self, obj: VALUE) -> bool {
167
- (obj & crate::special_consts::IMMEDIATE_MASK as VALUE) != 0
168
- }
169
-
170
- #[inline]
171
- fn rb_test(&self, obj: VALUE) -> bool {
172
- (obj & !(crate::Qnil as VALUE)) != 0
173
- }
174
-
175
- #[inline]
176
- unsafe fn type_p(&self, obj: VALUE, t: crate::ruby_value_type) -> bool {
177
- use crate::ruby_special_consts::*;
178
- use crate::ruby_value_type::*;
179
-
180
- if t == RUBY_T_TRUE {
181
- obj == RUBY_Qtrue as _
182
- } else if t == RUBY_T_FALSE {
183
- obj == RUBY_Qfalse as _
184
- } else if t == RUBY_T_NIL {
185
- obj == RUBY_Qnil as _
186
- } else if t == RUBY_T_UNDEF {
187
- obj == RUBY_Qundef as _
188
- } else if t == RUBY_T_FIXNUM {
189
- self.fixnum_p(obj)
190
- } else if t == RUBY_T_SYMBOL {
191
- self.symbol_p(obj)
192
- } else if t == RUBY_T_FLOAT {
193
- self.float_type_p(obj)
194
- } else if self.special_const_p(obj) {
195
- false
196
- } else if t == self.builtin_type(obj) {
197
- true
198
- } else {
199
- t == self.rb_type(obj)
200
- }
201
- }
202
-
203
- unsafe fn symbol_p(&self, obj: VALUE) -> bool {
204
- self.static_sym_p(obj) || self.dynamic_sym_p(obj)
205
- }
206
-
207
- unsafe fn float_type_p(&self, obj: VALUE) -> bool {
208
- if self.flonum_p(obj) {
209
- true
210
- } else if self.special_const_p(obj) {
211
- false
212
- } else {
213
- self.builtin_type(obj) == value_type::RUBY_T_FLOAT
214
- }
215
- }
216
-
217
- unsafe fn rb_type(&self, obj: VALUE) -> crate::ruby_value_type {
218
- use crate::ruby_special_consts::*;
219
- use crate::ruby_value_type::*;
220
-
221
- if !self.special_const_p(obj) {
222
- self.builtin_type(obj)
223
- } else if obj == RUBY_Qfalse as _ {
224
- RUBY_T_FALSE
225
- } else if obj == RUBY_Qnil as _ {
226
- RUBY_T_NIL
227
- } else if obj == RUBY_Qtrue as _ {
228
- RUBY_T_TRUE
229
- } else if obj == RUBY_Qundef as _ {
230
- RUBY_T_UNDEF
231
- } else if self.fixnum_p(obj) {
232
- RUBY_T_FIXNUM
233
- } else if self.static_sym_p(obj) {
234
- RUBY_T_SYMBOL
235
- } else {
236
- debug_assert!(self.flonum_p(obj));
237
- RUBY_T_FLOAT
238
- }
239
- }
240
-
241
- unsafe fn dynamic_sym_p(&self, obj: VALUE) -> bool {
242
- if self.special_const_p(obj) {
243
- false
244
- } else {
245
- self.builtin_type(obj) == value_type::RUBY_T_SYMBOL
246
- }
247
- }
248
-
249
- #[inline]
250
- unsafe fn integer_type_p(&self, obj: VALUE) -> bool {
251
- if self.fixnum_p(obj) {
252
- true
253
- } else if self.special_const_p(obj) {
254
- false
255
- } else {
256
- self.builtin_type(obj) == value_type::RUBY_T_BIGNUM
257
- }
258
- }
259
-
260
- #[inline]
261
- unsafe fn rstring_interned_p(&self, obj: VALUE) -> bool {
262
- assert!(self.type_p(obj, value_type::RUBY_T_STRING));
263
-
264
- let rstring: &RString = &*(obj as *const RString);
265
- let flags = rstring.basic.flags;
266
-
267
- (flags & crate::ruby_rstring_flags::RSTRING_FSTR as VALUE) != 0
268
- }
269
-
270
- #[inline]
271
- fn thread_sleep(&self, duration: Duration) {
272
- let seconds = duration.as_secs() as _;
273
- let microseconds = duration.subsec_micros() as _;
274
-
275
- let time = crate::timeval {
276
- tv_sec: seconds,
277
- tv_usec: microseconds,
278
- };
279
-
280
- unsafe { crate::rb_thread_wait_for(time) }
281
- }
282
-
283
- #[inline]
284
- unsafe fn rtypeddata_p(&self, obj: VALUE) -> bool {
285
- debug_ruby_assert_type!(obj, RUBY_T_DATA, "rtypeddata_p called on non-T_DATA object");
286
-
287
- // Access the RTypedData struct
288
- let rdata = obj as *const RTypedData;
289
- let typed_flag = (*rdata).typed_flag;
290
- // Valid typed_flag value for Ruby 2.6 is only 1
291
- typed_flag == 1
292
- }
293
-
294
- #[inline]
295
- unsafe fn rtypeddata_embedded_p(&self, _obj: VALUE) -> bool {
296
- // Ruby 2.6 doesn't support embedded data
297
- false
298
- }
299
-
300
- #[inline]
301
- unsafe fn rtypeddata_type(&self, obj: VALUE) -> *const crate::rb_data_type_t {
302
- debug_ruby_assert_type!(obj, RUBY_T_DATA, "rtypeddata_type called on non-T_DATA object");
303
-
304
- let rdata = obj as *const RTypedData;
305
- (*rdata).type_
306
- }
307
-
308
- #[inline]
309
- unsafe fn rtypeddata_get_data(&self, obj: VALUE) -> *mut c_void {
310
- debug_ruby_assert_type!(obj, RUBY_T_DATA, "rtypeddata_get_data called on non-T_DATA object");
311
-
312
- // For Ruby 2.6, simply return the data field
313
- let rdata = obj as *const RTypedData;
314
- (*rdata).data
315
- }
316
- }
@@ -1,316 +0,0 @@
1
- use super::StableApiDefinition;
2
- use crate::{
3
- VALUE, debug_ruby_assert_type,
4
- internal::{RArray, RString, RTypedData},
5
- ruby_value_type::RUBY_T_DATA,
6
- value_type,
7
- };
8
- use std::{
9
- ffi::c_void,
10
- os::raw::{c_char, c_long},
11
- ptr::NonNull,
12
- time::Duration,
13
- };
14
-
15
- #[cfg(not(ruby_eq_2_7))]
16
- compile_error!("This file should only be included in Ruby 2.7 builds");
17
-
18
- pub struct Definition;
19
-
20
- impl StableApiDefinition for Definition {
21
- const VERSION_MAJOR: u32 = 2;
22
- const VERSION_MINOR: u32 = 7;
23
-
24
- #[inline]
25
- unsafe fn rstring_len(&self, obj: VALUE) -> c_long {
26
- assert!(self.type_p(obj, crate::ruby_value_type::RUBY_T_STRING));
27
-
28
- let rstring: &RString = &*(obj as *const RString);
29
- let flags = rstring.basic.flags;
30
- let is_heap = (flags & crate::ruby_rstring_flags::RSTRING_NOEMBED as VALUE) != 0;
31
-
32
- if !is_heap {
33
- use crate::ruby_rstring_flags::RSTRING_EMBED_LEN_SHIFT;
34
-
35
- let mut f = rstring.basic.flags;
36
- f &= crate::ruby_rstring_flags::RSTRING_EMBED_LEN_MASK as VALUE;
37
- f >>= RSTRING_EMBED_LEN_SHIFT as VALUE;
38
- f as c_long
39
- } else {
40
- rstring.as_.heap.len
41
- }
42
- }
43
-
44
- #[inline]
45
- unsafe fn rstring_ptr(&self, obj: VALUE) -> *const c_char {
46
- assert!(self.type_p(obj, crate::ruby_value_type::RUBY_T_STRING));
47
-
48
- let rstring: &RString = &*(obj as *const RString);
49
- let flags = rstring.basic.flags;
50
- let is_heap = (flags & crate::ruby_rstring_flags::RSTRING_NOEMBED as VALUE) != 0;
51
- let ptr = if !is_heap {
52
- std::ptr::addr_of!(rstring.as_.ary) as *const _
53
- } else {
54
- rstring.as_.heap.ptr
55
- };
56
-
57
- assert!(!ptr.is_null());
58
-
59
- ptr
60
- }
61
-
62
- #[inline]
63
- unsafe fn rarray_len(&self, obj: VALUE) -> c_long {
64
- assert!(self.type_p(obj, value_type::RUBY_T_ARRAY));
65
-
66
- let rarray: &RArray = &*(obj as *const RArray);
67
- let flags = rarray.basic.flags;
68
- let is_embedded = (flags & crate::ruby_rarray_flags::RARRAY_EMBED_FLAG as VALUE) != 0;
69
-
70
- if is_embedded {
71
- let mut f = rarray.basic.flags;
72
- f &= crate::ruby_rarray_flags::RARRAY_EMBED_LEN_MASK as VALUE;
73
- f >>= crate::ruby_rarray_flags::RARRAY_EMBED_LEN_SHIFT as VALUE;
74
- f as c_long
75
- } else {
76
- rarray.as_.heap.len
77
- }
78
- }
79
-
80
- #[inline]
81
- unsafe fn rarray_const_ptr(&self, obj: VALUE) -> *const VALUE {
82
- assert!(self.type_p(obj, value_type::RUBY_T_ARRAY));
83
-
84
- let rarray: &RArray = &*(obj as *const RArray);
85
- let flags = rarray.basic.flags;
86
- let is_embedded = (flags & crate::ruby_rarray_flags::RARRAY_EMBED_FLAG as VALUE) != 0;
87
- let ptr = if is_embedded {
88
- std::ptr::addr_of!(rarray.as_.ary) as *const _
89
- } else {
90
- rarray.as_.heap.ptr
91
- };
92
-
93
- assert!(!ptr.is_null());
94
-
95
- ptr
96
- }
97
-
98
- #[inline]
99
- unsafe fn rbasic_class(&self, obj: VALUE) -> Option<NonNull<VALUE>> {
100
- let rbasic = obj as *const crate::RBasic;
101
-
102
- NonNull::<VALUE>::new((*rbasic).klass as _)
103
- }
104
-
105
- #[inline]
106
- unsafe fn frozen_p(&self, obj: VALUE) -> bool {
107
- if self.special_const_p(obj) {
108
- true
109
- } else {
110
- let rbasic = obj as *const crate::RBasic;
111
- ((*rbasic).flags & crate::ruby_fl_type::RUBY_FL_FREEZE as VALUE) != 0
112
- }
113
- }
114
-
115
- #[inline]
116
- unsafe fn bignum_positive_p(&self, obj: VALUE) -> bool {
117
- let rbasic = obj as *const crate::RBasic;
118
-
119
- ((*rbasic).flags & crate::ruby_fl_type::RUBY_FL_USER1 as VALUE) != 0
120
- }
121
-
122
- #[inline]
123
- fn special_const_p(&self, value: VALUE) -> bool {
124
- let is_immediate = value & (crate::special_consts::IMMEDIATE_MASK as VALUE) != 0;
125
- let test = (value & !(crate::Qnil as VALUE)) != 0;
126
-
127
- is_immediate || !test
128
- }
129
-
130
- #[inline]
131
- unsafe fn builtin_type(&self, obj: VALUE) -> crate::ruby_value_type {
132
- let rbasic = obj as *const crate::RBasic;
133
- let ret: u32 = ((*rbasic).flags & crate::ruby_value_type::RUBY_T_MASK as VALUE) as _;
134
-
135
- std::mem::transmute::<_, crate::ruby_value_type>(ret)
136
- }
137
-
138
- #[inline]
139
- fn nil_p(&self, obj: VALUE) -> bool {
140
- obj == (crate::Qnil as VALUE)
141
- }
142
-
143
- #[inline]
144
- fn fixnum_p(&self, obj: VALUE) -> bool {
145
- (obj & crate::FIXNUM_FLAG as VALUE) != 0
146
- }
147
-
148
- #[inline]
149
- fn static_sym_p(&self, obj: VALUE) -> bool {
150
- let mask = !(VALUE::MAX << crate::ruby_special_consts::RUBY_SPECIAL_SHIFT as VALUE);
151
- (obj & mask) == crate::ruby_special_consts::RUBY_SYMBOL_FLAG as VALUE
152
- }
153
-
154
- #[inline]
155
- fn flonum_p(&self, obj: VALUE) -> bool {
156
- #[cfg(ruby_use_flonum = "true")]
157
- let ret = (obj & crate::FLONUM_MASK as VALUE) == crate::FLONUM_FLAG as VALUE;
158
-
159
- #[cfg(not(ruby_use_flonum = "true"))]
160
- let ret = false;
161
-
162
- ret
163
- }
164
-
165
- #[inline]
166
- fn immediate_p(&self, obj: VALUE) -> bool {
167
- (obj & crate::special_consts::IMMEDIATE_MASK as VALUE) != 0
168
- }
169
-
170
- #[inline]
171
- fn rb_test(&self, obj: VALUE) -> bool {
172
- (obj & !(crate::Qnil as VALUE)) != 0
173
- }
174
-
175
- #[inline]
176
- unsafe fn type_p(&self, obj: VALUE, t: crate::ruby_value_type) -> bool {
177
- use crate::ruby_special_consts::*;
178
- use crate::ruby_value_type::*;
179
-
180
- if t == RUBY_T_TRUE {
181
- obj == RUBY_Qtrue as _
182
- } else if t == RUBY_T_FALSE {
183
- obj == RUBY_Qfalse as _
184
- } else if t == RUBY_T_NIL {
185
- obj == RUBY_Qnil as _
186
- } else if t == RUBY_T_UNDEF {
187
- obj == RUBY_Qundef as _
188
- } else if t == RUBY_T_FIXNUM {
189
- self.fixnum_p(obj)
190
- } else if t == RUBY_T_SYMBOL {
191
- self.symbol_p(obj)
192
- } else if t == RUBY_T_FLOAT {
193
- self.float_type_p(obj)
194
- } else if self.special_const_p(obj) {
195
- false
196
- } else if t == self.builtin_type(obj) {
197
- true
198
- } else {
199
- t == self.rb_type(obj)
200
- }
201
- }
202
-
203
- unsafe fn symbol_p(&self, obj: VALUE) -> bool {
204
- self.static_sym_p(obj) || self.dynamic_sym_p(obj)
205
- }
206
-
207
- unsafe fn float_type_p(&self, obj: VALUE) -> bool {
208
- if self.flonum_p(obj) {
209
- true
210
- } else if self.special_const_p(obj) {
211
- false
212
- } else {
213
- self.builtin_type(obj) == value_type::RUBY_T_FLOAT
214
- }
215
- }
216
-
217
- unsafe fn rb_type(&self, obj: VALUE) -> crate::ruby_value_type {
218
- use crate::ruby_special_consts::*;
219
- use crate::ruby_value_type::*;
220
-
221
- if !self.special_const_p(obj) {
222
- self.builtin_type(obj)
223
- } else if obj == RUBY_Qfalse as _ {
224
- RUBY_T_FALSE
225
- } else if obj == RUBY_Qnil as _ {
226
- RUBY_T_NIL
227
- } else if obj == RUBY_Qtrue as _ {
228
- RUBY_T_TRUE
229
- } else if obj == RUBY_Qundef as _ {
230
- RUBY_T_UNDEF
231
- } else if self.fixnum_p(obj) {
232
- RUBY_T_FIXNUM
233
- } else if self.static_sym_p(obj) {
234
- RUBY_T_SYMBOL
235
- } else {
236
- debug_assert!(self.flonum_p(obj));
237
- RUBY_T_FLOAT
238
- }
239
- }
240
-
241
- unsafe fn dynamic_sym_p(&self, obj: VALUE) -> bool {
242
- if self.special_const_p(obj) {
243
- false
244
- } else {
245
- self.builtin_type(obj) == value_type::RUBY_T_SYMBOL
246
- }
247
- }
248
-
249
- #[inline]
250
- unsafe fn integer_type_p(&self, obj: VALUE) -> bool {
251
- if self.fixnum_p(obj) {
252
- true
253
- } else if self.special_const_p(obj) {
254
- false
255
- } else {
256
- self.builtin_type(obj) == value_type::RUBY_T_BIGNUM
257
- }
258
- }
259
-
260
- #[inline]
261
- unsafe fn rstring_interned_p(&self, obj: VALUE) -> bool {
262
- assert!(self.type_p(obj, value_type::RUBY_T_STRING));
263
-
264
- let rstring: &RString = &*(obj as *const RString);
265
- let flags = rstring.basic.flags;
266
-
267
- (flags & crate::ruby_rstring_flags::RSTRING_FSTR as VALUE) != 0
268
- }
269
-
270
- #[inline]
271
- fn thread_sleep(&self, duration: Duration) {
272
- let seconds = duration.as_secs() as _;
273
- let microseconds = duration.subsec_micros() as _;
274
-
275
- let time = crate::timeval {
276
- tv_sec: seconds,
277
- tv_usec: microseconds,
278
- };
279
-
280
- unsafe { crate::rb_thread_wait_for(time) }
281
- }
282
-
283
- #[inline]
284
- unsafe fn rtypeddata_p(&self, obj: VALUE) -> bool {
285
- debug_ruby_assert_type!(obj, RUBY_T_DATA, "rtypeddata_p called on non-T_DATA object");
286
-
287
- // Access the RTypedData struct
288
- let rdata = obj as *const RTypedData;
289
- let typed_flag = (*rdata).typed_flag;
290
- // Valid typed_flag value for Ruby 2.7 is only 1
291
- typed_flag == 1
292
- }
293
-
294
- #[inline]
295
- unsafe fn rtypeddata_embedded_p(&self, _obj: VALUE) -> bool {
296
- // Ruby 2.7 doesn't support embedded data
297
- false
298
- }
299
-
300
- #[inline]
301
- unsafe fn rtypeddata_type(&self, obj: VALUE) -> *const crate::rb_data_type_t {
302
- debug_ruby_assert_type!(obj, RUBY_T_DATA, "rtypeddata_type called on non-T_DATA object");
303
-
304
- let rdata = obj as *const RTypedData;
305
- (*rdata).type_
306
- }
307
-
308
- #[inline]
309
- unsafe fn rtypeddata_get_data(&self, obj: VALUE) -> *mut c_void {
310
- debug_ruby_assert_type!(obj, RUBY_T_DATA, "rtypeddata_get_data called on non-T_DATA object");
311
-
312
- // For Ruby 2.7, simply return the data field
313
- let rdata = obj as *const RTypedData;
314
- (*rdata).data
315
- }
316
- }