@lix-js/sdk 0.6.0-preview.0 → 0.6.0-preview.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (196)
  1. package/README.md +9 -0
  2. package/SKILL.md +468 -0
  3. package/dist/engine-wasm/index.d.ts +15 -11
  4. package/dist/engine-wasm/index.js +105 -38
  5. package/dist/engine-wasm/wasm/lix_engine.d.ts +14 -2
  6. package/dist/engine-wasm/wasm/lix_engine.js +18 -17
  7. package/dist/engine-wasm/wasm/lix_engine.wasm +0 -0
  8. package/dist/engine-wasm/wasm/lix_engine.wasm.d.ts +2 -1
  9. package/dist/generated/builtin-schemas.d.ts +31 -41
  10. package/dist/generated/builtin-schemas.js +52 -56
  11. package/dist/open-lix.d.ts +141 -24
  12. package/dist/open-lix.js +199 -35
  13. package/dist/sqlite/index.js +99 -22
  14. package/dist-engine-src/README.md +18 -0
  15. package/dist-engine-src/src/backend/kv.rs +358 -0
  16. package/dist-engine-src/src/backend/mod.rs +12 -0
  17. package/dist-engine-src/src/backend/testing.rs +658 -0
  18. package/dist-engine-src/src/backend/types.rs +96 -0
  19. package/dist-engine-src/src/binary_cas/chunking.rs +31 -0
  20. package/dist-engine-src/src/binary_cas/codec.rs +346 -0
  21. package/dist-engine-src/src/binary_cas/context.rs +139 -0
  22. package/dist-engine-src/src/binary_cas/kv.rs +1063 -0
  23. package/dist-engine-src/src/binary_cas/mod.rs +11 -0
  24. package/dist-engine-src/src/binary_cas/types.rs +127 -0
  25. package/dist-engine-src/src/cel/context.rs +86 -0
  26. package/dist-engine-src/src/cel/error.rs +19 -0
  27. package/dist-engine-src/src/cel/mod.rs +8 -0
  28. package/dist-engine-src/src/cel/provider.rs +9 -0
  29. package/dist-engine-src/src/cel/runtime.rs +167 -0
  30. package/dist-engine-src/src/cel/value.rs +50 -0
  31. package/dist-engine-src/src/changelog/codec.rs +321 -0
  32. package/dist-engine-src/src/changelog/context.rs +92 -0
  33. package/dist-engine-src/src/changelog/materialization.rs +121 -0
  34. package/dist-engine-src/src/changelog/mod.rs +13 -0
  35. package/dist-engine-src/src/changelog/reader.rs +20 -0
  36. package/dist-engine-src/src/changelog/storage.rs +220 -0
  37. package/dist-engine-src/src/changelog/types.rs +38 -0
  38. package/dist-engine-src/src/commit_graph/context.rs +1588 -0
  39. package/dist-engine-src/src/commit_graph/mod.rs +12 -0
  40. package/dist-engine-src/src/commit_graph/types.rs +145 -0
  41. package/dist-engine-src/src/commit_graph/walker.rs +780 -0
  42. package/dist-engine-src/src/common/error.rs +313 -0
  43. package/dist-engine-src/src/common/fingerprint.rs +3 -0
  44. package/dist-engine-src/src/common/fs_path.rs +1336 -0
  45. package/dist-engine-src/src/common/identity.rs +135 -0
  46. package/dist-engine-src/src/common/metadata.rs +35 -0
  47. package/dist-engine-src/src/common/mod.rs +23 -0
  48. package/dist-engine-src/src/common/types.rs +105 -0
  49. package/dist-engine-src/src/common/wire.rs +222 -0
  50. package/dist-engine-src/src/engine.rs +239 -0
  51. package/dist-engine-src/src/entity_identity.rs +285 -0
  52. package/dist-engine-src/src/functions/context.rs +327 -0
  53. package/dist-engine-src/src/functions/deterministic.rs +113 -0
  54. package/dist-engine-src/src/functions/mod.rs +18 -0
  55. package/dist-engine-src/src/functions/provider.rs +130 -0
  56. package/dist-engine-src/src/functions/state.rs +363 -0
  57. package/dist-engine-src/src/functions/types.rs +37 -0
  58. package/dist-engine-src/src/init.rs +505 -0
  59. package/dist-engine-src/src/json_store/compression.rs +77 -0
  60. package/dist-engine-src/src/json_store/context.rs +129 -0
  61. package/dist-engine-src/src/json_store/encoded.rs +15 -0
  62. package/dist-engine-src/src/json_store/mod.rs +9 -0
  63. package/dist-engine-src/src/json_store/store.rs +236 -0
  64. package/dist-engine-src/src/json_store/types.rs +52 -0
  65. package/dist-engine-src/src/lib.rs +61 -0
  66. package/dist-engine-src/src/live_state/context.rs +2241 -0
  67. package/dist-engine-src/src/live_state/mod.rs +15 -0
  68. package/dist-engine-src/src/live_state/overlay.rs +75 -0
  69. package/dist-engine-src/src/live_state/reader.rs +23 -0
  70. package/dist-engine-src/src/live_state/types.rs +239 -0
  71. package/dist-engine-src/src/live_state/visibility.rs +218 -0
  72. package/dist-engine-src/src/plugin/archive.rs +441 -0
  73. package/dist-engine-src/src/plugin/component.rs +183 -0
  74. package/dist-engine-src/src/plugin/install.rs +637 -0
  75. package/dist-engine-src/src/plugin/manifest.rs +516 -0
  76. package/dist-engine-src/src/plugin/materializer.rs +477 -0
  77. package/dist-engine-src/src/plugin/mod.rs +33 -0
  78. package/dist-engine-src/src/plugin/plugin_manifest.json +119 -0
  79. package/dist-engine-src/src/plugin/storage.rs +74 -0
  80. package/dist-engine-src/src/schema/annotations/defaults.rs +280 -0
  81. package/dist-engine-src/src/schema/annotations/mod.rs +1 -0
  82. package/dist-engine-src/src/schema/builtin/lix_account.json +22 -0
  83. package/dist-engine-src/src/schema/builtin/lix_active_account.json +30 -0
  84. package/dist-engine-src/src/schema/builtin/lix_binary_blob_ref.json +30 -0
  85. package/dist-engine-src/src/schema/builtin/lix_change.json +62 -0
  86. package/dist-engine-src/src/schema/builtin/lix_change_author.json +46 -0
  87. package/dist-engine-src/src/schema/builtin/lix_change_set.json +18 -0
  88. package/dist-engine-src/src/schema/builtin/lix_change_set_element.json +75 -0
  89. package/dist-engine-src/src/schema/builtin/lix_commit.json +62 -0
  90. package/dist-engine-src/src/schema/builtin/lix_commit_edge.json +46 -0
  91. package/dist-engine-src/src/schema/builtin/lix_directory_descriptor.json +53 -0
  92. package/dist-engine-src/src/schema/builtin/lix_entity_label.json +63 -0
  93. package/dist-engine-src/src/schema/builtin/lix_file_descriptor.json +53 -0
  94. package/dist-engine-src/src/schema/builtin/lix_key_value.json +41 -0
  95. package/dist-engine-src/src/schema/builtin/lix_label.json +22 -0
  96. package/dist-engine-src/src/schema/builtin/lix_registered_schema.json +31 -0
  97. package/dist-engine-src/src/schema/builtin/lix_version_descriptor.json +35 -0
  98. package/dist-engine-src/src/schema/builtin/lix_version_ref.json +49 -0
  99. package/dist-engine-src/src/schema/builtin/mod.rs +271 -0
  100. package/dist-engine-src/src/schema/definition.json +157 -0
  101. package/dist-engine-src/src/schema/definition.rs +636 -0
  102. package/dist-engine-src/src/schema/key.rs +206 -0
  103. package/dist-engine-src/src/schema/mod.rs +20 -0
  104. package/dist-engine-src/src/schema/seed.rs +14 -0
  105. package/dist-engine-src/src/schema/tests.rs +739 -0
  106. package/dist-engine-src/src/schema_registry.rs +294 -0
  107. package/dist-engine-src/src/session/context.rs +366 -0
  108. package/dist-engine-src/src/session/create_version.rs +80 -0
  109. package/dist-engine-src/src/session/execute.rs +447 -0
  110. package/dist-engine-src/src/session/merge/analysis.rs +102 -0
  111. package/dist-engine-src/src/session/merge/apply.rs +23 -0
  112. package/dist-engine-src/src/session/merge/conflicts.rs +62 -0
  113. package/dist-engine-src/src/session/merge/mod.rs +11 -0
  114. package/dist-engine-src/src/session/merge/stats.rs +65 -0
  115. package/dist-engine-src/src/session/merge/version.rs +437 -0
  116. package/dist-engine-src/src/session/mod.rs +25 -0
  117. package/dist-engine-src/src/session/switch_version.rs +121 -0
  118. package/dist-engine-src/src/sql2/change_provider.rs +337 -0
  119. package/dist-engine-src/src/sql2/classify.rs +147 -0
  120. package/dist-engine-src/src/sql2/commit_derived_provider.rs +591 -0
  121. package/dist-engine-src/src/sql2/context.rs +307 -0
  122. package/dist-engine-src/src/sql2/directory_history_provider.rs +623 -0
  123. package/dist-engine-src/src/sql2/directory_provider.rs +2405 -0
  124. package/dist-engine-src/src/sql2/dml.rs +148 -0
  125. package/dist-engine-src/src/sql2/entity_history_provider.rs +444 -0
  126. package/dist-engine-src/src/sql2/entity_provider.rs +2700 -0
  127. package/dist-engine-src/src/sql2/error.rs +196 -0
  128. package/dist-engine-src/src/sql2/execute.rs +3379 -0
  129. package/dist-engine-src/src/sql2/file_history_provider.rs +902 -0
  130. package/dist-engine-src/src/sql2/file_provider.rs +3254 -0
  131. package/dist-engine-src/src/sql2/filesystem_planner.rs +1526 -0
  132. package/dist-engine-src/src/sql2/filesystem_predicates.rs +159 -0
  133. package/dist-engine-src/src/sql2/filesystem_visibility.rs +369 -0
  134. package/dist-engine-src/src/sql2/history_projection.rs +80 -0
  135. package/dist-engine-src/src/sql2/history_provider.rs +418 -0
  136. package/dist-engine-src/src/sql2/history_route.rs +643 -0
  137. package/dist-engine-src/src/sql2/lix_state_provider.rs +2430 -0
  138. package/dist-engine-src/src/sql2/mod.rs +43 -0
  139. package/dist-engine-src/src/sql2/read_only.rs +65 -0
  140. package/dist-engine-src/src/sql2/record_batch.rs +17 -0
  141. package/dist-engine-src/src/sql2/result_metadata.rs +29 -0
  142. package/dist-engine-src/src/sql2/runtime.rs +60 -0
  143. package/dist-engine-src/src/sql2/session.rs +135 -0
  144. package/dist-engine-src/src/sql2/udfs/common.rs +295 -0
  145. package/dist-engine-src/src/sql2/udfs/lix_active_version_commit_id.rs +53 -0
  146. package/dist-engine-src/src/sql2/udfs/lix_empty_blob.rs +47 -0
  147. package/dist-engine-src/src/sql2/udfs/lix_json.rs +100 -0
  148. package/dist-engine-src/src/sql2/udfs/lix_json_get.rs +99 -0
  149. package/dist-engine-src/src/sql2/udfs/lix_json_get_text.rs +99 -0
  150. package/dist-engine-src/src/sql2/udfs/lix_text_decode.rs +82 -0
  151. package/dist-engine-src/src/sql2/udfs/lix_text_encode.rs +85 -0
  152. package/dist-engine-src/src/sql2/udfs/lix_uuid_v7.rs +76 -0
  153. package/dist-engine-src/src/sql2/udfs/mod.rs +82 -0
  154. package/dist-engine-src/src/sql2/version_provider.rs +1187 -0
  155. package/dist-engine-src/src/sql2/version_scope.rs +394 -0
  156. package/dist-engine-src/src/sql2/write_normalization.rs +345 -0
  157. package/dist-engine-src/src/storage/context.rs +356 -0
  158. package/dist-engine-src/src/storage/mod.rs +14 -0
  159. package/dist-engine-src/src/storage/read_scope.rs +88 -0
  160. package/dist-engine-src/src/storage/types.rs +501 -0
  161. package/dist-engine-src/src/storage_bench.rs +3406 -0
  162. package/dist-engine-src/src/test_support.rs +81 -0
  163. package/dist-engine-src/src/tracked_state/by_file_index.rs +102 -0
  164. package/dist-engine-src/src/tracked_state/codec.rs +747 -0
  165. package/dist-engine-src/src/tracked_state/context.rs +983 -0
  166. package/dist-engine-src/src/tracked_state/diff.rs +494 -0
  167. package/dist-engine-src/src/tracked_state/materialization.rs +141 -0
  168. package/dist-engine-src/src/tracked_state/merge.rs +474 -0
  169. package/dist-engine-src/src/tracked_state/mod.rs +31 -0
  170. package/dist-engine-src/src/tracked_state/rebuild.rs +771 -0
  171. package/dist-engine-src/src/tracked_state/storage.rs +243 -0
  172. package/dist-engine-src/src/tracked_state/tree.rs +2744 -0
  173. package/dist-engine-src/src/tracked_state/tree_types.rs +176 -0
  174. package/dist-engine-src/src/tracked_state/types.rs +61 -0
  175. package/dist-engine-src/src/transaction/commit.rs +1224 -0
  176. package/dist-engine-src/src/transaction/context.rs +1307 -0
  177. package/dist-engine-src/src/transaction/live_state_overlay.rs +34 -0
  178. package/dist-engine-src/src/transaction/mod.rs +11 -0
  179. package/dist-engine-src/src/transaction/normalization.rs +1026 -0
  180. package/dist-engine-src/src/transaction/schema_resolver.rs +127 -0
  181. package/dist-engine-src/src/transaction/staging.rs +1436 -0
  182. package/dist-engine-src/src/transaction/types.rs +351 -0
  183. package/dist-engine-src/src/transaction/validation.rs +4811 -0
  184. package/dist-engine-src/src/untracked_state/codec.rs +363 -0
  185. package/dist-engine-src/src/untracked_state/context.rs +82 -0
  186. package/dist-engine-src/src/untracked_state/materialization.rs +157 -0
  187. package/dist-engine-src/src/untracked_state/mod.rs +17 -0
  188. package/dist-engine-src/src/untracked_state/storage.rs +348 -0
  189. package/dist-engine-src/src/untracked_state/types.rs +96 -0
  190. package/dist-engine-src/src/version/context.rs +52 -0
  191. package/dist-engine-src/src/version/mod.rs +12 -0
  192. package/dist-engine-src/src/version/refs.rs +421 -0
  193. package/dist-engine-src/src/version/stage_rows.rs +71 -0
  194. package/dist-engine-src/src/version/types.rs +21 -0
  195. package/dist-engine-src/src/wasm/mod.rs +60 -0
  196. package/package.json +68 -63
@@ -0,0 +1,345 @@
1
+ use std::collections::{BTreeMap, BTreeSet};
2
+ use std::sync::Arc;
3
+
4
+ use datafusion::arrow::array::ArrayRef;
5
+ use datafusion::arrow::datatypes::DataType;
6
+ use datafusion::arrow::record_batch::RecordBatch;
7
+ use datafusion::common::{DataFusionError, Result, ScalarValue};
8
+ use datafusion::logical_expr::Expr;
9
+ use datafusion::physical_expr::expressions::{CastExpr, Literal};
10
+ use datafusion::physical_expr::PhysicalExpr;
11
+ use datafusion::physical_plan::projection::ProjectionExec;
12
+ use datafusion::physical_plan::ExecutionPlan;
13
+
14
+ use crate::LixError;
15
+
16
+ #[derive(Debug, Clone)]
17
+ pub(crate) enum SqlCell {
18
+ Null,
19
+ Value(ScalarValue),
20
+ }
21
+
22
+ impl SqlCell {
23
+ pub(crate) fn from_scalar(value: ScalarValue) -> Self {
24
+ if value.is_null() {
25
+ Self::Null
26
+ } else {
27
+ Self::Value(value)
28
+ }
29
+ }
30
+ }
31
+
32
+ #[derive(Debug, Clone)]
33
+ pub(crate) enum InsertCell {
34
+ Omitted,
35
+ Provided(SqlCell),
36
+ }
37
+
38
+ #[derive(Debug, Clone)]
39
+ pub(crate) enum UpdateCell {
40
+ Unassigned,
41
+ Assigned(SqlCell),
42
+ }
43
+
44
+ #[derive(Debug, Clone)]
45
+ pub(crate) struct InsertColumnIntents {
46
+ explicit_columns: Option<BTreeSet<String>>,
47
+ }
48
+
49
+ impl InsertColumnIntents {
50
+ pub(crate) fn all_explicit() -> Self {
51
+ Self {
52
+ explicit_columns: None,
53
+ }
54
+ }
55
+
56
+ pub(crate) fn from_input(input: &Arc<dyn ExecutionPlan>) -> Self {
57
+ let Some(projection) = input.as_any().downcast_ref::<ProjectionExec>() else {
58
+ return Self {
59
+ explicit_columns: None,
60
+ };
61
+ };
62
+
63
+ let explicit_columns = projection
64
+ .expr()
65
+ .iter()
66
+ .filter(|expr| !is_generated_null_default(expr.expr.as_ref()))
67
+ .map(|expr| expr.alias.clone())
68
+ .collect();
69
+
70
+ Self {
71
+ explicit_columns: Some(explicit_columns),
72
+ }
73
+ }
74
+
75
+ pub(crate) fn includes_column(&self, column_name: &str) -> bool {
76
+ self.explicit_columns
77
+ .as_ref()
78
+ .is_none_or(|columns| columns.contains(column_name))
79
+ }
80
+
81
+ pub(crate) fn cell(
82
+ &self,
83
+ batch: &RecordBatch,
84
+ row_index: usize,
85
+ column_name: &str,
86
+ ) -> Result<InsertCell> {
87
+ if !self.includes_column(column_name) {
88
+ return Ok(InsertCell::Omitted);
89
+ }
90
+
91
+ optional_scalar_value(batch, row_index, column_name).map(|value| match value {
92
+ None => InsertCell::Omitted,
93
+ Some(value) => InsertCell::Provided(SqlCell::from_scalar(value)),
94
+ })
95
+ }
96
+ }
97
+
98
+ pub(crate) fn reject_non_binary_casts_for_insert_column(
99
+ input: &Arc<dyn ExecutionPlan>,
100
+ column_name: &str,
101
+ context: &str,
102
+ ) -> Result<()> {
103
+ reject_non_binary_casts_for_insert_column_in_plan(input.as_ref(), column_name, context)
104
+ }
105
+
106
+ fn reject_non_binary_casts_for_insert_column_in_plan(
107
+ input: &dyn ExecutionPlan,
108
+ column_name: &str,
109
+ context: &str,
110
+ ) -> Result<()> {
111
+ let Some(projection) = input.as_any().downcast_ref::<ProjectionExec>() else {
112
+ for child in input.children() {
113
+ reject_non_binary_casts_for_insert_column_in_plan(
114
+ child.as_ref(),
115
+ column_name,
116
+ context,
117
+ )?;
118
+ }
119
+ return Ok(());
120
+ };
121
+
122
+ let Some(expr) = projection
123
+ .expr()
124
+ .iter()
125
+ .find(|expr| expr.alias == column_name)
126
+ else {
127
+ return Ok(());
128
+ };
129
+
130
+ if contains_non_binary_cast_to_binary(expr.expr.as_ref()) {
131
+ return Err(super::error::lix_error_to_datafusion_error(
132
+ LixError::new(
133
+ LixError::CODE_TYPE_MISMATCH,
134
+ format!("{context} expected binary column '{column_name}'"),
135
+ )
136
+ .with_hint("Use X'...' or a binary parameter for file contents."),
137
+ ));
138
+ }
139
+
140
+ Ok(())
141
+ }
142
+
143
+ fn contains_non_binary_cast_to_binary(expr: &dyn PhysicalExpr) -> bool {
144
+ let Some(cast) = expr.as_any().downcast_ref::<CastExpr>() else {
145
+ return false;
146
+ };
147
+
148
+ if is_binary_type(cast.cast_type()) && !physical_expr_is_binary_or_null(cast.expr().as_ref()) {
149
+ return true;
150
+ }
151
+
152
+ contains_non_binary_cast_to_binary(cast.expr().as_ref())
153
+ }
154
+
155
+ fn physical_expr_is_binary_or_null(expr: &dyn PhysicalExpr) -> bool {
156
+ if let Some(literal) = expr.as_any().downcast_ref::<Literal>() {
157
+ return scalar_is_binary_or_null(literal.value());
158
+ }
159
+
160
+ if let Some(cast) = expr.as_any().downcast_ref::<CastExpr>() {
161
+ return is_binary_type(cast.cast_type())
162
+ && physical_expr_is_binary_or_null(cast.expr().as_ref());
163
+ }
164
+
165
+ false
166
+ }
167
+
168
+ pub(crate) fn scalar_is_binary_or_null(value: &ScalarValue) -> bool {
169
+ value.is_null()
170
+ || matches!(
171
+ value,
172
+ ScalarValue::Binary(_)
173
+ | ScalarValue::LargeBinary(_)
174
+ | ScalarValue::FixedSizeBinary(_, _)
175
+ )
176
+ }
177
+
178
+ pub(crate) fn logical_expr_is_binary_or_null(expr: &Expr) -> bool {
179
+ match expr {
180
+ Expr::Literal(value, _) => scalar_is_binary_or_null(value),
181
+ Expr::Cast(cast) => {
182
+ is_binary_type(&cast.data_type) && logical_expr_is_binary_or_null(&cast.expr)
183
+ }
184
+ Expr::Alias(alias) => logical_expr_is_binary_or_null(&alias.expr),
185
+ _ => false,
186
+ }
187
+ }
188
+
189
+ pub(crate) fn is_binary_type(data_type: &DataType) -> bool {
190
+ matches!(
191
+ data_type,
192
+ DataType::Binary | DataType::LargeBinary | DataType::FixedSizeBinary(_)
193
+ )
194
+ }
195
+
196
+ pub(crate) fn lix_file_data_type_lix_error() -> LixError {
197
+ LixError::new(
198
+ LixError::CODE_TYPE_MISMATCH,
199
+ "lix_file.data expects binary data",
200
+ )
201
+ .with_hint("Use X'...' or a binary parameter for file contents.")
202
+ }
203
+
204
+ pub(crate) fn lix_file_data_type_error(
205
+ context: &str,
206
+ column_name: &str,
207
+ instruction: &str,
208
+ ) -> DataFusionError {
209
+ super::error::lix_error_to_datafusion_error(
210
+ LixError::new(
211
+ LixError::CODE_TYPE_MISMATCH,
212
+ format!("{context} expected binary column '{column_name}'"),
213
+ )
214
+ .with_hint(instruction),
215
+ )
216
+ }
217
+
218
+ pub(crate) fn lix_file_data_type_error_with_value(
219
+ context: &str,
220
+ column_name: &str,
221
+ value: &ScalarValue,
222
+ instruction: &str,
223
+ ) -> DataFusionError {
224
+ super::error::lix_error_to_datafusion_error(
225
+ LixError::new(
226
+ LixError::CODE_TYPE_MISMATCH,
227
+ format!("{context} expected binary column '{column_name}', got {value:?}"),
228
+ )
229
+ .with_hint(instruction),
230
+ )
231
+ }
232
+
233
+ pub(crate) struct UpdateAssignmentValues {
234
+ values: BTreeMap<String, ArrayRef>,
235
+ }
236
+
237
+ impl UpdateAssignmentValues {
238
+ pub(crate) fn evaluate(
239
+ batch: &RecordBatch,
240
+ assignments: &[(String, Arc<dyn PhysicalExpr>)],
241
+ ) -> Result<Self> {
242
+ let mut values = BTreeMap::new();
243
+ for (column_name, assignment) in assignments {
244
+ values.insert(
245
+ column_name.clone(),
246
+ assignment.evaluate(batch)?.into_array(batch.num_rows())?,
247
+ );
248
+ }
249
+ Ok(Self { values })
250
+ }
251
+
252
+ #[cfg(test)]
253
+ pub(crate) fn from_batch_columns(batch: &RecordBatch, columns: &[&str]) -> Self {
254
+ let values = columns
255
+ .iter()
256
+ .filter_map(|column_name| {
257
+ let column_index = batch.schema().index_of(column_name).ok()?;
258
+ Some((
259
+ (*column_name).to_string(),
260
+ Arc::clone(batch.column(column_index)),
261
+ ))
262
+ })
263
+ .collect();
264
+ Self { values }
265
+ }
266
+
267
+ /// Returns only the value explicitly assigned by SQL UPDATE.
268
+ ///
269
+ /// Use this for document-patch semantics where `Unassigned` must remain
270
+ /// distinct from `Assigned(NULL)`.
271
+ pub(crate) fn assigned_cell(&self, row_index: usize, column_name: &str) -> Result<UpdateCell> {
272
+ let Some(array) = self.values.get(column_name) else {
273
+ return Ok(UpdateCell::Unassigned);
274
+ };
275
+
276
+ ScalarValue::try_from_array(array.as_ref(), row_index)
277
+ .map(SqlCell::from_scalar)
278
+ .map(UpdateCell::Assigned)
279
+ .map_err(|error| {
280
+ DataFusionError::Execution(format!(
281
+ "failed to decode SQL UPDATE assignment for column '{column_name}' at row {row_index}: {error}"
282
+ ))
283
+ })
284
+ }
285
+
286
+ /// Returns the assigned SQL UPDATE value, or falls back to the existing row
287
+ /// column value when the column was not assigned.
288
+ ///
289
+ /// Use this for scalar row-column semantics. Do not use it to reconstruct
290
+ /// JSON documents from projected property columns, because projection can
291
+ /// erase the difference between an absent property and an explicit null.
292
+ pub(crate) fn assigned_or_existing_cell(
293
+ &self,
294
+ batch: &RecordBatch,
295
+ row_index: usize,
296
+ column_name: &str,
297
+ ) -> Result<InsertCell> {
298
+ match self.assigned_cell(row_index, column_name)? {
299
+ UpdateCell::Assigned(value) => Ok(InsertCell::Provided(value)),
300
+ UpdateCell::Unassigned => {
301
+ optional_scalar_value(batch, row_index, column_name).map(|value| match value {
302
+ None => InsertCell::Omitted,
303
+ Some(value) => InsertCell::Provided(SqlCell::from_scalar(value)),
304
+ })
305
+ }
306
+ }
307
+ }
308
+ }
309
+
310
+ pub(crate) fn optional_scalar_value(
311
+ batch: &RecordBatch,
312
+ row_index: usize,
313
+ column_name: &str,
314
+ ) -> Result<Option<ScalarValue>> {
315
+ let schema = batch.schema();
316
+ let column_index = match schema.index_of(column_name) {
317
+ Ok(column_index) => column_index,
318
+ Err(_) => return Ok(None),
319
+ };
320
+ if row_index >= batch.num_rows() {
321
+ return Err(DataFusionError::Execution(format!(
322
+ "row index {row_index} out of bounds for SQL write batch with {} rows",
323
+ batch.num_rows()
324
+ )));
325
+ }
326
+ ScalarValue::try_from_array(batch.column(column_index).as_ref(), row_index)
327
+ .map(Some)
328
+ .map_err(|error| {
329
+ DataFusionError::Execution(format!(
330
+ "failed to decode SQL write column '{column_name}' at row {row_index}: {error}"
331
+ ))
332
+ })
333
+ }
334
+
335
+ fn is_generated_null_default(expr: &dyn PhysicalExpr) -> bool {
336
+ if let Some(literal) = expr.as_any().downcast_ref::<Literal>() {
337
+ return literal.value().is_null();
338
+ }
339
+
340
+ if let Some(cast) = expr.as_any().downcast_ref::<CastExpr>() {
341
+ return is_generated_null_default(cast.expr().as_ref());
342
+ }
343
+
344
+ false
345
+ }
@@ -0,0 +1,356 @@
1
+ use std::sync::Arc;
2
+
3
+ use async_trait::async_trait;
4
+
5
+ use crate::backend::{Backend, BackendReadTransaction, BackendWriteTransaction};
6
+ use crate::storage::types::{KvWriteBatch, StorageWriter};
7
+ use crate::storage::{
8
+ KvEntryPage, KvExistsBatch, KvGetRequest, KvKeyPage, KvScanRequest, KvValueBatch, KvValuePage,
9
+ KvWriteStats, StorageReadTransaction, StorageReader, StorageWriteTransaction,
10
+ };
11
+ use crate::LixError;
12
+
13
+ #[derive(Clone)]
14
+ pub(crate) struct StorageContext {
15
+ backend: Arc<dyn Backend + Send + Sync>,
16
+ }
17
+
18
+ impl StorageContext {
19
+ pub(crate) fn new(backend: Arc<dyn Backend + Send + Sync>) -> Self {
20
+ Self { backend }
21
+ }
22
+
23
+ pub(crate) async fn begin_read_transaction(
24
+ &self,
25
+ ) -> Result<Box<dyn StorageReadTransaction + Send + Sync + 'static>, LixError> {
26
+ let transaction = self.backend.begin_read_transaction().await?;
27
+ Ok(Box::new(StorageContextReadTransaction { transaction }))
28
+ }
29
+
30
+ pub(crate) async fn begin_write_transaction(
31
+ &self,
32
+ ) -> Result<Box<dyn StorageWriteTransaction + Send + Sync + 'static>, LixError> {
33
+ let transaction = self.backend.begin_write_transaction().await?;
34
+ Ok(Box::new(StorageContextWriteTransaction { transaction }))
35
+ }
36
+
37
+ pub(crate) async fn close(&self) -> Result<(), LixError> {
38
+ self.backend.close().await
39
+ }
40
+
41
+ pub(crate) async fn destroy(&self) -> Result<(), LixError> {
42
+ self.backend.destroy().await
43
+ }
44
+ }
45
+
46
/// Convenience reader for tests and storage benches: every call opens its own
/// read transaction, performs one read, and rolls the transaction back.
///
/// If the read fails, its error is returned and the rollback outcome is
/// ignored. If the read succeeds but the rollback fails, the rollback error is
/// returned instead of the data.
#[cfg(any(test, feature = "storage-benches"))]
#[async_trait]
impl StorageReader for StorageContext {
    async fn get_values(&mut self, request: KvGetRequest) -> Result<KvValueBatch, LixError> {
        let mut transaction = self.begin_read_transaction().await?;
        let outcome = transaction.get_values(request).await;
        // The transaction is always rolled back, whatever the read returned.
        let rollback = transaction.rollback().await;
        let batch = outcome?;
        rollback?;
        Ok(batch)
    }

    async fn exists_many(&mut self, request: KvGetRequest) -> Result<KvExistsBatch, LixError> {
        let mut transaction = self.begin_read_transaction().await?;
        let outcome = transaction.exists_many(request).await;
        let rollback = transaction.rollback().await;
        let batch = outcome?;
        rollback?;
        Ok(batch)
    }

    async fn scan_keys(&mut self, request: KvScanRequest) -> Result<KvKeyPage, LixError> {
        let mut transaction = self.begin_read_transaction().await?;
        let outcome = transaction.scan_keys(request).await;
        let rollback = transaction.rollback().await;
        let page = outcome?;
        rollback?;
        Ok(page)
    }

    async fn scan_values(&mut self, request: KvScanRequest) -> Result<KvValuePage, LixError> {
        let mut transaction = self.begin_read_transaction().await?;
        let outcome = transaction.scan_values(request).await;
        let rollback = transaction.rollback().await;
        let page = outcome?;
        rollback?;
        Ok(page)
    }

    async fn scan_entries(&mut self, request: KvScanRequest) -> Result<KvEntryPage, LixError> {
        let mut transaction = self.begin_read_transaction().await?;
        let outcome = transaction.scan_entries(request).await;
        let rollback = transaction.rollback().await;
        let page = outcome?;
        rollback?;
        Ok(page)
    }
}
124
+
125
+ struct StorageContextReadTransaction {
126
+ transaction: Box<dyn BackendReadTransaction + Send + Sync + 'static>,
127
+ }
128
+
129
+ struct StorageContextWriteTransaction {
130
+ transaction: Box<dyn BackendWriteTransaction + Send + Sync + 'static>,
131
+ }
132
+
133
+ #[async_trait]
134
+ impl StorageReader for StorageContextReadTransaction {
135
+ async fn get_values(&mut self, request: KvGetRequest) -> Result<KvValueBatch, LixError> {
136
+ self.transaction
137
+ .get_values(request.into())
138
+ .await
139
+ .map(Into::into)
140
+ }
141
+
142
+ async fn exists_many(&mut self, request: KvGetRequest) -> Result<KvExistsBatch, LixError> {
143
+ self.transaction
144
+ .exists_many(request.into())
145
+ .await
146
+ .map(Into::into)
147
+ }
148
+
149
+ async fn scan_keys(&mut self, request: KvScanRequest) -> Result<KvKeyPage, LixError> {
150
+ self.transaction
151
+ .scan_keys(request.into())
152
+ .await
153
+ .map(Into::into)
154
+ }
155
+
156
+ async fn scan_values(&mut self, request: KvScanRequest) -> Result<KvValuePage, LixError> {
157
+ self.transaction
158
+ .scan_values(request.into())
159
+ .await
160
+ .map(Into::into)
161
+ }
162
+
163
+ async fn scan_entries(&mut self, request: KvScanRequest) -> Result<KvEntryPage, LixError> {
164
+ self.transaction
165
+ .scan_entries(request.into())
166
+ .await
167
+ .map(Into::into)
168
+ }
169
+ }
170
+
171
+ #[async_trait]
172
+ impl StorageReadTransaction for StorageContextReadTransaction {
173
+ async fn rollback(self: Box<Self>) -> Result<(), LixError> {
174
+ self.transaction.rollback().await
175
+ }
176
+ }
177
+
178
+ #[async_trait]
179
+ impl StorageReader for StorageContextWriteTransaction {
180
+ async fn get_values(&mut self, request: KvGetRequest) -> Result<KvValueBatch, LixError> {
181
+ self.transaction
182
+ .get_values(request.into())
183
+ .await
184
+ .map(Into::into)
185
+ }
186
+
187
+ async fn exists_many(&mut self, request: KvGetRequest) -> Result<KvExistsBatch, LixError> {
188
+ self.transaction
189
+ .exists_many(request.into())
190
+ .await
191
+ .map(Into::into)
192
+ }
193
+
194
+ async fn scan_keys(&mut self, request: KvScanRequest) -> Result<KvKeyPage, LixError> {
195
+ self.transaction
196
+ .scan_keys(request.into())
197
+ .await
198
+ .map(Into::into)
199
+ }
200
+
201
+ async fn scan_values(&mut self, request: KvScanRequest) -> Result<KvValuePage, LixError> {
202
+ self.transaction
203
+ .scan_values(request.into())
204
+ .await
205
+ .map(Into::into)
206
+ }
207
+
208
+ async fn scan_entries(&mut self, request: KvScanRequest) -> Result<KvEntryPage, LixError> {
209
+ self.transaction
210
+ .scan_entries(request.into())
211
+ .await
212
+ .map(Into::into)
213
+ }
214
+ }
215
+
216
+ #[async_trait]
217
+ impl StorageWriter for StorageContextWriteTransaction {
218
+ async fn write_kv_batch(&mut self, batch: KvWriteBatch) -> Result<KvWriteStats, LixError> {
219
+ self.transaction
220
+ .write_kv_batch(batch.into())
221
+ .await
222
+ .map(Into::into)
223
+ }
224
+ }
225
+
226
+ #[async_trait]
227
+ impl StorageReadTransaction for StorageContextWriteTransaction {
228
+ async fn rollback(self: Box<Self>) -> Result<(), LixError> {
229
+ self.transaction.rollback().await
230
+ }
231
+ }
232
+
233
+ #[async_trait]
234
+ impl StorageWriteTransaction for StorageContextWriteTransaction {
235
+ async fn commit(self: Box<Self>) -> Result<(), LixError> {
236
+ self.transaction.commit().await
237
+ }
238
+ }
239
+
240
#[cfg(test)]
mod tests {
    use std::sync::Arc;

    use crate::backend::testing::UnitTestBackend;
    use crate::storage::types::KvWriteBatch;
    use crate::storage::{KvGetGroup, KvScanRange, StorageWriteSet};

    use super::*;

    /// Creates a `StorageContext` over a fresh `UnitTestBackend`.
    fn unit_test_storage() -> StorageContext {
        let backend: Arc<dyn Backend + Send + Sync> = Arc::new(UnitTestBackend::new());
        StorageContext::new(backend)
    }

    #[tokio::test]
    async fn storage_context_roundtrips_batched_writes_and_reads() {
        let storage = unit_test_storage();

        // Write two entries in a single batch and commit them.
        let mut write_tx = storage
            .begin_write_transaction()
            .await
            .expect("transaction opens");
        let mut batch = KvWriteBatch::new();
        batch.put("ns", b"a".to_vec(), b"1".to_vec());
        batch.put("ns", b"b".to_vec(), b"2".to_vec());
        let write_stats = write_tx.write_kv_batch(batch).await.expect("batch writes");
        assert_eq!(write_stats.puts, 2);
        write_tx.commit().await.expect("commit succeeds");

        let mut read_tx = storage
            .begin_read_transaction()
            .await
            .expect("read transaction opens");

        // Point lookups return both committed values.
        let values = read_tx
            .get_values(KvGetRequest {
                groups: vec![KvGetGroup {
                    namespace: "ns".to_string(),
                    keys: vec![b"a".to_vec(), b"b".to_vec()],
                }],
            })
            .await
            .expect("batch reads");
        assert_eq!(values.groups[0].value(0), Some(Some(b"1".as_slice())));
        assert_eq!(values.groups[0].value(1), Some(Some(b"2".as_slice())));

        // Existence checks distinguish a stored key from a missing one.
        let exists = read_tx
            .exists_many(KvGetRequest {
                groups: vec![KvGetGroup {
                    namespace: "ns".to_string(),
                    keys: vec![b"a".to_vec(), b"missing".to_vec()],
                }],
            })
            .await
            .expect("existence reads");
        assert_eq!(exists.groups[0].exists, vec![true, false]);

        // Scanning after key "a" with a limit of one yields entry "b".
        let entries = read_tx
            .scan_entries(KvScanRequest {
                namespace: "ns".to_string(),
                range: KvScanRange::prefix(Vec::new()),
                after: Some(b"a".to_vec()),
                limit: 1,
            })
            .await
            .expect("scan reads");
        assert_eq!(entries.key(0).expect("key exists"), b"b");
        assert_eq!(entries.value(0).expect("value exists"), b"2");

        // A key-only scan from the start returns both keys in order.
        let key_only = read_tx
            .scan_keys(KvScanRequest {
                namespace: "ns".to_string(),
                range: KvScanRange::prefix(Vec::new()),
                after: None,
                limit: 2,
            })
            .await
            .expect("key-only scan reads");
        assert_eq!(key_only.keys.iter().collect::<Vec<_>>(), vec![b"a", b"b"]);
        read_tx.rollback().await.expect("rollback succeeds");
    }

    #[tokio::test]
    async fn storage_write_set_applies_as_one_batch() {
        let storage = unit_test_storage();
        let mut write_tx = storage
            .begin_write_transaction()
            .await
            .expect("transaction opens");

        // Stage two puts and one delete; the set is empty until the first staged write.
        let mut writes = StorageWriteSet::new();
        assert!(writes.is_empty());
        writes.put("ns", b"a".to_vec(), b"1".to_vec());
        writes.put("ns", b"b".to_vec(), b"2".to_vec());
        writes.delete("ns", b"missing".to_vec());
        assert!(!writes.is_empty());

        let write_stats = writes
            .apply(write_tx.as_mut())
            .await
            .expect("write set applies");
        assert_eq!(write_stats.puts, 2);
        assert_eq!(write_stats.deletes, 1);
        write_tx.commit().await.expect("commit succeeds");

        // Both staged puts are visible after the commit.
        let mut read_tx = storage
            .begin_read_transaction()
            .await
            .expect("read transaction opens");
        let values = read_tx
            .get_values(KvGetRequest {
                groups: vec![KvGetGroup {
                    namespace: "ns".to_string(),
                    keys: vec![b"a".to_vec(), b"b".to_vec()],
                }],
            })
            .await
            .expect("batch reads");
        assert_eq!(values.groups[0].value(0), Some(Some(&b"1"[..])));
        assert_eq!(values.groups[0].value(1), Some(Some(&b"2"[..])));
        read_tx.rollback().await.expect("rollback succeeds");
    }
}
@@ -0,0 +1,14 @@
1
+ mod context;
2
+ mod read_scope;
3
+ mod types;
4
+
5
+ pub(crate) use context::StorageContext;
6
+ pub(crate) use read_scope::{ScopedStorageReader, StorageReadScope};
7
+ pub(crate) use types::{
8
+ KvEntryPage, KvExistsBatch, KvExistsGroup, KvGetGroup, KvGetRequest, KvKeyPage, KvScanRange,
9
+ KvScanRequest, KvValueBatch, KvValueGroup, KvValuePage, KvWriteStats, StorageReadTransaction,
10
+ StorageReader, StorageWriteSet, StorageWriteTransaction,
11
+ };
12
+
13
+ #[cfg(feature = "storage-benches")]
14
+ pub(crate) use types::{KvWriteBatch, KvWriteGroup};