@lix-js/sdk 0.6.0-preview.4 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (223) hide show
  1. package/README.md +76 -4
  2. package/dist/errors.d.ts +7 -0
  3. package/dist/errors.js +19 -0
  4. package/dist/index.d.ts +4 -5
  5. package/dist/index.js +3 -3
  6. package/dist/native.d.ts +1 -0
  7. package/dist/native.js +47 -0
  8. package/dist/open-lix.d.ts +39 -201
  9. package/dist/open-lix.js +59 -284
  10. package/dist/result.d.ts +18 -0
  11. package/dist/result.js +48 -0
  12. package/dist/types.d.ts +114 -1
  13. package/dist/value.d.ts +28 -0
  14. package/dist/value.js +245 -0
  15. package/package.json +20 -50
  16. package/SKILL.md +0 -506
  17. package/dist/builtin-schemas.d.ts +0 -1
  18. package/dist/builtin-schemas.js +0 -1
  19. package/dist/engine-wasm/index.d.ts +0 -87
  20. package/dist/engine-wasm/index.js +0 -339
  21. package/dist/engine-wasm/wasm/lix_engine.d.ts +0 -79
  22. package/dist/engine-wasm/wasm/lix_engine.js +0 -821
  23. package/dist/engine-wasm/wasm/lix_engine.wasm +0 -0
  24. package/dist/engine-wasm/wasm/lix_engine.wasm.d.ts +0 -26
  25. package/dist/generated/builtin-schemas.d.ts +0 -427
  26. package/dist/generated/builtin-schemas.js +0 -643
  27. package/dist/sqlite/index.d.ts +0 -12
  28. package/dist/sqlite/index.js +0 -303
  29. package/dist-engine-src/README.md +0 -18
  30. package/dist-engine-src/src/backend/kv.rs +0 -358
  31. package/dist-engine-src/src/backend/mod.rs +0 -12
  32. package/dist-engine-src/src/backend/testing.rs +0 -658
  33. package/dist-engine-src/src/backend/types.rs +0 -96
  34. package/dist-engine-src/src/binary_cas/chunking.rs +0 -31
  35. package/dist-engine-src/src/binary_cas/codec.rs +0 -346
  36. package/dist-engine-src/src/binary_cas/context.rs +0 -139
  37. package/dist-engine-src/src/binary_cas/kv.rs +0 -1063
  38. package/dist-engine-src/src/binary_cas/mod.rs +0 -11
  39. package/dist-engine-src/src/binary_cas/types.rs +0 -121
  40. package/dist-engine-src/src/catalog/context.rs +0 -412
  41. package/dist-engine-src/src/catalog/mod.rs +0 -10
  42. package/dist-engine-src/src/catalog/schema.rs +0 -4
  43. package/dist-engine-src/src/catalog/snapshot.rs +0 -1114
  44. package/dist-engine-src/src/cel/context.rs +0 -86
  45. package/dist-engine-src/src/cel/error.rs +0 -19
  46. package/dist-engine-src/src/cel/mod.rs +0 -8
  47. package/dist-engine-src/src/cel/provider.rs +0 -9
  48. package/dist-engine-src/src/cel/runtime.rs +0 -167
  49. package/dist-engine-src/src/cel/value.rs +0 -50
  50. package/dist-engine-src/src/commit_graph/context.rs +0 -901
  51. package/dist-engine-src/src/commit_graph/mod.rs +0 -11
  52. package/dist-engine-src/src/commit_graph/types.rs +0 -109
  53. package/dist-engine-src/src/commit_graph/walker.rs +0 -756
  54. package/dist-engine-src/src/commit_store/codec.rs +0 -887
  55. package/dist-engine-src/src/commit_store/context.rs +0 -944
  56. package/dist-engine-src/src/commit_store/materialization.rs +0 -84
  57. package/dist-engine-src/src/commit_store/mod.rs +0 -16
  58. package/dist-engine-src/src/commit_store/storage.rs +0 -600
  59. package/dist-engine-src/src/commit_store/types.rs +0 -215
  60. package/dist-engine-src/src/common/error.rs +0 -313
  61. package/dist-engine-src/src/common/fingerprint.rs +0 -3
  62. package/dist-engine-src/src/common/fs_path.rs +0 -1336
  63. package/dist-engine-src/src/common/identity.rs +0 -145
  64. package/dist-engine-src/src/common/json_pointer.rs +0 -67
  65. package/dist-engine-src/src/common/metadata.rs +0 -40
  66. package/dist-engine-src/src/common/mod.rs +0 -23
  67. package/dist-engine-src/src/common/types.rs +0 -105
  68. package/dist-engine-src/src/common/wire.rs +0 -222
  69. package/dist-engine-src/src/domain.rs +0 -324
  70. package/dist-engine-src/src/engine.rs +0 -225
  71. package/dist-engine-src/src/entity_identity.rs +0 -405
  72. package/dist-engine-src/src/functions/context.rs +0 -292
  73. package/dist-engine-src/src/functions/deterministic.rs +0 -113
  74. package/dist-engine-src/src/functions/mod.rs +0 -18
  75. package/dist-engine-src/src/functions/provider.rs +0 -130
  76. package/dist-engine-src/src/functions/state.rs +0 -336
  77. package/dist-engine-src/src/functions/types.rs +0 -37
  78. package/dist-engine-src/src/init.rs +0 -558
  79. package/dist-engine-src/src/json_store/compression.rs +0 -77
  80. package/dist-engine-src/src/json_store/context.rs +0 -423
  81. package/dist-engine-src/src/json_store/encoded.rs +0 -15
  82. package/dist-engine-src/src/json_store/mod.rs +0 -12
  83. package/dist-engine-src/src/json_store/store.rs +0 -1109
  84. package/dist-engine-src/src/json_store/types.rs +0 -217
  85. package/dist-engine-src/src/lib.rs +0 -62
  86. package/dist-engine-src/src/live_state/context.rs +0 -2019
  87. package/dist-engine-src/src/live_state/mod.rs +0 -15
  88. package/dist-engine-src/src/live_state/overlay.rs +0 -75
  89. package/dist-engine-src/src/live_state/reader.rs +0 -23
  90. package/dist-engine-src/src/live_state/types.rs +0 -222
  91. package/dist-engine-src/src/live_state/visibility.rs +0 -223
  92. package/dist-engine-src/src/plugin/archive.rs +0 -438
  93. package/dist-engine-src/src/plugin/component.rs +0 -183
  94. package/dist-engine-src/src/plugin/install.rs +0 -619
  95. package/dist-engine-src/src/plugin/manifest.rs +0 -516
  96. package/dist-engine-src/src/plugin/materializer.rs +0 -477
  97. package/dist-engine-src/src/plugin/mod.rs +0 -33
  98. package/dist-engine-src/src/plugin/plugin_manifest.json +0 -118
  99. package/dist-engine-src/src/plugin/storage.rs +0 -74
  100. package/dist-engine-src/src/schema/annotations/defaults.rs +0 -275
  101. package/dist-engine-src/src/schema/annotations/mod.rs +0 -1
  102. package/dist-engine-src/src/schema/builtin/lix_account.json +0 -21
  103. package/dist-engine-src/src/schema/builtin/lix_active_account.json +0 -29
  104. package/dist-engine-src/src/schema/builtin/lix_binary_blob_ref.json +0 -29
  105. package/dist-engine-src/src/schema/builtin/lix_change.json +0 -63
  106. package/dist-engine-src/src/schema/builtin/lix_change_author.json +0 -45
  107. package/dist-engine-src/src/schema/builtin/lix_commit.json +0 -24
  108. package/dist-engine-src/src/schema/builtin/lix_commit_edge.json +0 -53
  109. package/dist-engine-src/src/schema/builtin/lix_directory_descriptor.json +0 -52
  110. package/dist-engine-src/src/schema/builtin/lix_file_descriptor.json +0 -52
  111. package/dist-engine-src/src/schema/builtin/lix_key_value.json +0 -40
  112. package/dist-engine-src/src/schema/builtin/lix_label.json +0 -29
  113. package/dist-engine-src/src/schema/builtin/lix_label_assignment.json +0 -74
  114. package/dist-engine-src/src/schema/builtin/lix_registered_schema.json +0 -25
  115. package/dist-engine-src/src/schema/builtin/lix_version_descriptor.json +0 -34
  116. package/dist-engine-src/src/schema/builtin/lix_version_ref.json +0 -48
  117. package/dist-engine-src/src/schema/builtin/mod.rs +0 -222
  118. package/dist-engine-src/src/schema/compatibility.rs +0 -787
  119. package/dist-engine-src/src/schema/definition.json +0 -187
  120. package/dist-engine-src/src/schema/definition.rs +0 -742
  121. package/dist-engine-src/src/schema/key.rs +0 -138
  122. package/dist-engine-src/src/schema/mod.rs +0 -20
  123. package/dist-engine-src/src/schema/seed.rs +0 -14
  124. package/dist-engine-src/src/schema/tests.rs +0 -780
  125. package/dist-engine-src/src/session/context.rs +0 -404
  126. package/dist-engine-src/src/session/create_version.rs +0 -88
  127. package/dist-engine-src/src/session/execute.rs +0 -541
  128. package/dist-engine-src/src/session/merge/analysis.rs +0 -102
  129. package/dist-engine-src/src/session/merge/apply.rs +0 -23
  130. package/dist-engine-src/src/session/merge/conflicts.rs +0 -63
  131. package/dist-engine-src/src/session/merge/mod.rs +0 -11
  132. package/dist-engine-src/src/session/merge/stats.rs +0 -65
  133. package/dist-engine-src/src/session/merge/version.rs +0 -427
  134. package/dist-engine-src/src/session/mod.rs +0 -27
  135. package/dist-engine-src/src/session/optimization9_sql2_bench.rs +0 -100
  136. package/dist-engine-src/src/session/switch_version.rs +0 -110
  137. package/dist-engine-src/src/session/transaction.rs +0 -76
  138. package/dist-engine-src/src/sql2/change_provider.rs +0 -331
  139. package/dist-engine-src/src/sql2/classify.rs +0 -174
  140. package/dist-engine-src/src/sql2/context.rs +0 -311
  141. package/dist-engine-src/src/sql2/directory_history_provider.rs +0 -631
  142. package/dist-engine-src/src/sql2/directory_provider.rs +0 -2453
  143. package/dist-engine-src/src/sql2/dml.rs +0 -148
  144. package/dist-engine-src/src/sql2/entity_history_provider.rs +0 -440
  145. package/dist-engine-src/src/sql2/entity_provider.rs +0 -3211
  146. package/dist-engine-src/src/sql2/error.rs +0 -215
  147. package/dist-engine-src/src/sql2/execute.rs +0 -3533
  148. package/dist-engine-src/src/sql2/file_history_provider.rs +0 -910
  149. package/dist-engine-src/src/sql2/file_provider.rs +0 -3679
  150. package/dist-engine-src/src/sql2/filesystem_planner.rs +0 -1490
  151. package/dist-engine-src/src/sql2/filesystem_predicates.rs +0 -159
  152. package/dist-engine-src/src/sql2/filesystem_visibility.rs +0 -383
  153. package/dist-engine-src/src/sql2/history_projection.rs +0 -56
  154. package/dist-engine-src/src/sql2/history_provider.rs +0 -412
  155. package/dist-engine-src/src/sql2/history_route.rs +0 -657
  156. package/dist-engine-src/src/sql2/lix_state_provider.rs +0 -2512
  157. package/dist-engine-src/src/sql2/mod.rs +0 -47
  158. package/dist-engine-src/src/sql2/predicate_typecheck.rs +0 -246
  159. package/dist-engine-src/src/sql2/public_bind/assignment.rs +0 -46
  160. package/dist-engine-src/src/sql2/public_bind/capability.rs +0 -41
  161. package/dist-engine-src/src/sql2/public_bind/dml.rs +0 -172
  162. package/dist-engine-src/src/sql2/public_bind/mod.rs +0 -26
  163. package/dist-engine-src/src/sql2/public_bind/table.rs +0 -168
  164. package/dist-engine-src/src/sql2/read_only.rs +0 -63
  165. package/dist-engine-src/src/sql2/record_batch.rs +0 -17
  166. package/dist-engine-src/src/sql2/result_metadata.rs +0 -29
  167. package/dist-engine-src/src/sql2/runtime.rs +0 -60
  168. package/dist-engine-src/src/sql2/session.rs +0 -132
  169. package/dist-engine-src/src/sql2/udfs/common.rs +0 -295
  170. package/dist-engine-src/src/sql2/udfs/lix_active_version_commit_id.rs +0 -53
  171. package/dist-engine-src/src/sql2/udfs/lix_empty_blob.rs +0 -47
  172. package/dist-engine-src/src/sql2/udfs/lix_json.rs +0 -100
  173. package/dist-engine-src/src/sql2/udfs/lix_json_get.rs +0 -99
  174. package/dist-engine-src/src/sql2/udfs/lix_json_get_text.rs +0 -99
  175. package/dist-engine-src/src/sql2/udfs/lix_text_decode.rs +0 -82
  176. package/dist-engine-src/src/sql2/udfs/lix_text_encode.rs +0 -85
  177. package/dist-engine-src/src/sql2/udfs/lix_timestamp.rs +0 -76
  178. package/dist-engine-src/src/sql2/udfs/lix_uuid_v7.rs +0 -76
  179. package/dist-engine-src/src/sql2/udfs/mod.rs +0 -89
  180. package/dist-engine-src/src/sql2/udfs/public_call.rs +0 -238
  181. package/dist-engine-src/src/sql2/version_provider.rs +0 -1202
  182. package/dist-engine-src/src/sql2/version_scope.rs +0 -394
  183. package/dist-engine-src/src/sql2/write_normalization.rs +0 -345
  184. package/dist-engine-src/src/storage/context.rs +0 -356
  185. package/dist-engine-src/src/storage/mod.rs +0 -14
  186. package/dist-engine-src/src/storage/read_scope.rs +0 -88
  187. package/dist-engine-src/src/storage/types.rs +0 -501
  188. package/dist-engine-src/src/storage_bench.rs +0 -4863
  189. package/dist-engine-src/src/test_support.rs +0 -228
  190. package/dist-engine-src/src/tracked_state/by_file_index.rs +0 -98
  191. package/dist-engine-src/src/tracked_state/codec.rs +0 -2085
  192. package/dist-engine-src/src/tracked_state/context.rs +0 -1867
  193. package/dist-engine-src/src/tracked_state/diff.rs +0 -686
  194. package/dist-engine-src/src/tracked_state/materialization.rs +0 -403
  195. package/dist-engine-src/src/tracked_state/materializer.rs +0 -488
  196. package/dist-engine-src/src/tracked_state/merge.rs +0 -492
  197. package/dist-engine-src/src/tracked_state/mod.rs +0 -32
  198. package/dist-engine-src/src/tracked_state/storage.rs +0 -375
  199. package/dist-engine-src/src/tracked_state/tree.rs +0 -3187
  200. package/dist-engine-src/src/tracked_state/types.rs +0 -231
  201. package/dist-engine-src/src/transaction/commit.rs +0 -1484
  202. package/dist-engine-src/src/transaction/context.rs +0 -1548
  203. package/dist-engine-src/src/transaction/live_state_overlay.rs +0 -35
  204. package/dist-engine-src/src/transaction/mod.rs +0 -13
  205. package/dist-engine-src/src/transaction/normalization.rs +0 -890
  206. package/dist-engine-src/src/transaction/prep.rs +0 -37
  207. package/dist-engine-src/src/transaction/schema_resolver.rs +0 -149
  208. package/dist-engine-src/src/transaction/staging.rs +0 -1731
  209. package/dist-engine-src/src/transaction/types.rs +0 -460
  210. package/dist-engine-src/src/transaction/validation.rs +0 -5830
  211. package/dist-engine-src/src/untracked_state/codec.rs +0 -307
  212. package/dist-engine-src/src/untracked_state/context.rs +0 -98
  213. package/dist-engine-src/src/untracked_state/materialization.rs +0 -63
  214. package/dist-engine-src/src/untracked_state/mod.rs +0 -15
  215. package/dist-engine-src/src/untracked_state/storage.rs +0 -396
  216. package/dist-engine-src/src/untracked_state/types.rs +0 -146
  217. package/dist-engine-src/src/version/context.rs +0 -40
  218. package/dist-engine-src/src/version/lifecycle.rs +0 -221
  219. package/dist-engine-src/src/version/mod.rs +0 -13
  220. package/dist-engine-src/src/version/refs.rs +0 -330
  221. package/dist-engine-src/src/version/stage_rows.rs +0 -67
  222. package/dist-engine-src/src/version/types.rs +0 -21
  223. package/dist-engine-src/src/wasm/mod.rs +0 -60
@@ -1,110 +0,0 @@
1
- use std::sync::Arc;
2
-
3
- use serde_json::json;
4
-
5
- use crate::transaction::types::{TransactionJson, TransactionWriteRow};
6
- use crate::version::{VersionLifecycle, VersionOperation, VersionReferenceRole};
7
- use crate::LixError;
8
- use crate::GLOBAL_VERSION_ID;
9
-
10
- use super::context::{SessionContext, SessionMode, WORKSPACE_VERSION_KEY};
11
-
12
- const KEY_VALUE_SCHEMA_KEY: &str = "lix_key_value";
13
-
14
- /// Options for switching a session to another version.
15
- #[derive(Debug, Clone, PartialEq, Eq)]
16
- pub struct SwitchVersionOptions {
17
- pub version_id: String,
18
- }
19
-
20
- /// Receipt returned after switching to another version.
21
- #[derive(Debug, Clone, PartialEq, Eq)]
22
- pub struct SwitchVersionReceipt {
23
- pub version_id: String,
24
- }
25
-
26
- impl SessionContext {
27
- /// Switches the session's active version selector.
28
- ///
29
- /// Pinned sessions switch in memory and return a new pinned session.
30
- /// Workspace sessions update the shared workspace selector so other
31
- /// workspace sessions observe the new active version on their next use.
32
- pub async fn switch_version(
33
- &self,
34
- options: SwitchVersionOptions,
35
- ) -> Result<(SessionContext, SwitchVersionReceipt), LixError> {
36
- let version_id = options.version_id;
37
- let receipt_version_id = version_id.clone();
38
- let current_mode = self.mode.clone();
39
- let next_mode = self
40
- .with_write_transaction(|transaction| {
41
- Box::pin(async move {
42
- {
43
- let reader = transaction.version_ref_reader();
44
- VersionLifecycle::new(&reader)
45
- .require_existing_commit_id(
46
- &version_id,
47
- VersionOperation::SwitchVersion,
48
- VersionReferenceRole::Target,
49
- )
50
- .await?
51
- };
52
-
53
- match current_mode {
54
- SessionMode::Pinned { .. } => Ok(SessionMode::Pinned {
55
- version_id: version_id.clone(),
56
- }),
57
- SessionMode::Workspace => {
58
- transaction
59
- .stage_rows(vec![workspace_version_stage_row(&version_id)?])
60
- .await?;
61
- Ok(SessionMode::Workspace)
62
- }
63
- }
64
- })
65
- })
66
- .await?;
67
-
68
- let session = SessionContext::new_with_closed(
69
- next_mode,
70
- self.storage.clone(),
71
- Arc::clone(&self.live_state),
72
- Arc::clone(&self.tracked_state),
73
- Arc::clone(&self.binary_cas),
74
- Arc::clone(&self.commit_store),
75
- Arc::clone(&self.version_ctx),
76
- Arc::clone(&self.catalog_context),
77
- self.closed_flag(),
78
- self.active_transaction_flag(),
79
- );
80
- Ok((
81
- session,
82
- SwitchVersionReceipt {
83
- version_id: receipt_version_id,
84
- },
85
- ))
86
- }
87
- }
88
-
89
- fn workspace_version_stage_row(version_id: &str) -> Result<TransactionWriteRow, LixError> {
90
- Ok(TransactionWriteRow {
91
- entity_id: Some(crate::entity_identity::EntityIdentity::single(
92
- WORKSPACE_VERSION_KEY,
93
- )),
94
- schema_key: KEY_VALUE_SCHEMA_KEY.to_string(),
95
- file_id: None,
96
- snapshot: Some(TransactionJson::from_value_unchecked(json!({
97
- "key": WORKSPACE_VERSION_KEY,
98
- "value": version_id,
99
- }))),
100
- metadata: None,
101
- origin: None,
102
- created_at: None,
103
- updated_at: None,
104
- global: true,
105
- change_id: None,
106
- commit_id: None,
107
- untracked: true,
108
- version_id: GLOBAL_VERSION_ID.to_string(),
109
- })
110
- }
@@ -1,76 +0,0 @@
1
- use std::sync::Arc;
2
-
3
- use crate::functions::FunctionContext;
4
- use crate::transaction::{open_transaction, Transaction};
5
- use crate::LixError;
6
-
7
- use super::context::SessionTransactionGuard;
8
- use super::SessionContext;
9
-
10
- pub struct SessionTransaction {
11
- pub(super) transaction: Option<Transaction>,
12
- pub(super) runtime_functions: FunctionContext,
13
- _transaction_guard: SessionTransactionGuard,
14
- }
15
-
16
- impl SessionContext {
17
- pub async fn begin_transaction(&self) -> Result<SessionTransaction, LixError> {
18
- self.ensure_open()?;
19
- let transaction_guard = self.reserve_session_transaction()?;
20
- let opened = match open_transaction(
21
- &self.mode,
22
- self.storage.clone(),
23
- Arc::clone(&self.live_state),
24
- Arc::clone(&self.tracked_state),
25
- Arc::clone(&self.binary_cas),
26
- Arc::clone(&self.commit_store),
27
- Arc::clone(&self.version_ctx),
28
- Arc::clone(&self.catalog_context),
29
- )
30
- .await
31
- {
32
- Ok(opened) => opened,
33
- Err(error) => {
34
- return Err(error);
35
- }
36
- };
37
- Ok(SessionTransaction {
38
- transaction: Some(opened.transaction),
39
- runtime_functions: opened.runtime_functions,
40
- _transaction_guard: transaction_guard,
41
- })
42
- }
43
- }
44
-
45
- impl SessionTransaction {
46
- pub(super) fn transaction_mut(&mut self) -> Result<&mut Transaction, LixError> {
47
- self.transaction
48
- .as_mut()
49
- .ok_or_else(|| transaction_state_error("Lix transaction is closed"))
50
- }
51
-
52
- pub async fn commit(mut self) -> Result<(), LixError> {
53
- let transaction = self
54
- .transaction
55
- .take()
56
- .ok_or_else(|| transaction_state_error("Lix transaction is closed"))?;
57
- let result = transaction
58
- .commit(&self.runtime_functions)
59
- .await
60
- .map(|_| ());
61
- result
62
- }
63
-
64
- pub async fn rollback(mut self) -> Result<(), LixError> {
65
- let transaction = self
66
- .transaction
67
- .take()
68
- .ok_or_else(|| transaction_state_error("Lix transaction is closed"))?;
69
- let result = transaction.rollback().await;
70
- result
71
- }
72
- }
73
-
74
- pub(crate) fn transaction_state_error(message: impl Into<String>) -> LixError {
75
- LixError::new("LIX_INVALID_TRANSACTION_STATE", message)
76
- }
@@ -1,331 +0,0 @@
1
- use std::any::Any;
2
- use std::sync::Arc;
3
-
4
- use async_trait::async_trait;
5
- use datafusion::arrow::array::{ArrayRef, StringArray};
6
- use datafusion::arrow::datatypes::{DataType, Field, Schema, SchemaRef};
7
- use datafusion::arrow::record_batch::RecordBatch;
8
- use datafusion::catalog::{Session, TableProvider};
9
- use datafusion::common::{DataFusionError, Result};
10
- use datafusion::datasource::TableType;
11
- use datafusion::execution::TaskContext;
12
- use datafusion::logical_expr::{Expr, TableProviderFilterPushDown};
13
- use datafusion::physical_expr::EquivalenceProperties;
14
- use datafusion::physical_plan::execution_plan::{Boundedness, EmissionType, PlanProperties};
15
- use datafusion::physical_plan::stream::RecordBatchStreamAdapter;
16
- use datafusion::physical_plan::{
17
- DisplayAs, DisplayFormatType, ExecutionPlan, Partitioning, SendableRecordBatchStream,
18
- };
19
- use futures_util::stream;
20
-
21
- use crate::commit_store::ChangeScanRequest;
22
- use crate::serialize_row_metadata;
23
- use crate::LixError;
24
-
25
- use super::record_batch::record_batch_with_row_count;
26
- use super::result_metadata::json_field;
27
- use super::SqlCommitStoreQuerySource;
28
- use crate::commit_store::{materialize_change, MaterializedChange};
29
-
30
- pub(crate) async fn register_lix_change_provider(
31
- session: &datafusion::prelude::SessionContext,
32
- query_source: SqlCommitStoreQuerySource,
33
- ) -> Result<(), LixError> {
34
- session
35
- .register_table("lix_change", Arc::new(LixChangeProvider::new(query_source)))
36
- .map_err(datafusion_error_to_lix_error)?;
37
- Ok(())
38
- }
39
-
40
- struct LixChangeProvider {
41
- schema: SchemaRef,
42
- query_source: SqlCommitStoreQuerySource,
43
- }
44
-
45
- impl std::fmt::Debug for LixChangeProvider {
46
- fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
47
- f.debug_struct("LixChangeProvider").finish()
48
- }
49
- }
50
-
51
- impl LixChangeProvider {
52
- fn new(query_source: SqlCommitStoreQuerySource) -> Self {
53
- Self {
54
- schema: lix_change_schema(),
55
- query_source,
56
- }
57
- }
58
- }
59
-
60
- #[async_trait]
61
- impl TableProvider for LixChangeProvider {
62
- fn as_any(&self) -> &dyn Any {
63
- self
64
- }
65
-
66
- fn schema(&self) -> SchemaRef {
67
- Arc::clone(&self.schema)
68
- }
69
-
70
- fn table_type(&self) -> TableType {
71
- TableType::Base
72
- }
73
-
74
- fn supports_filters_pushdown(
75
- &self,
76
- filters: &[&Expr],
77
- ) -> Result<Vec<TableProviderFilterPushDown>> {
78
- Ok(filters
79
- .iter()
80
- .map(|_| TableProviderFilterPushDown::Unsupported)
81
- .collect())
82
- }
83
-
84
- async fn scan(
85
- &self,
86
- _state: &dyn Session,
87
- projection: Option<&Vec<usize>>,
88
- _filters: &[Expr],
89
- limit: Option<usize>,
90
- ) -> Result<Arc<dyn ExecutionPlan>> {
91
- Ok(Arc::new(LixChangeScanExec::new(
92
- self.query_source.clone(),
93
- projected_schema(&self.schema, projection),
94
- projection.cloned(),
95
- limit,
96
- )))
97
- }
98
- }
99
-
100
- struct LixChangeScanExec {
101
- query_source: SqlCommitStoreQuerySource,
102
- schema: SchemaRef,
103
- projection: Option<Vec<usize>>,
104
- limit: Option<usize>,
105
- properties: Arc<PlanProperties>,
106
- }
107
-
108
- impl std::fmt::Debug for LixChangeScanExec {
109
- fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
110
- f.debug_struct("LixChangeScanExec").finish()
111
- }
112
- }
113
-
114
- impl LixChangeScanExec {
115
- fn new(
116
- query_source: SqlCommitStoreQuerySource,
117
- schema: SchemaRef,
118
- projection: Option<Vec<usize>>,
119
- limit: Option<usize>,
120
- ) -> Self {
121
- let properties = PlanProperties::new(
122
- EquivalenceProperties::new(schema.clone()),
123
- Partitioning::UnknownPartitioning(1),
124
- EmissionType::Incremental,
125
- Boundedness::Bounded,
126
- );
127
- Self {
128
- query_source,
129
- schema,
130
- projection,
131
- limit,
132
- properties: Arc::new(properties),
133
- }
134
- }
135
- }
136
-
137
- impl DisplayAs for LixChangeScanExec {
138
- fn fmt_as(&self, t: DisplayFormatType, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
139
- match t {
140
- DisplayFormatType::Default | DisplayFormatType::Verbose => {
141
- write!(f, "LixChangeScanExec")
142
- }
143
- DisplayFormatType::TreeRender => write!(f, "LixChangeScanExec"),
144
- }
145
- }
146
- }
147
-
148
- impl ExecutionPlan for LixChangeScanExec {
149
- fn name(&self) -> &str {
150
- "LixChangeScanExec"
151
- }
152
-
153
- fn as_any(&self) -> &dyn Any {
154
- self
155
- }
156
-
157
- fn properties(&self) -> &Arc<PlanProperties> {
158
- &self.properties
159
- }
160
-
161
- fn children(&self) -> Vec<&Arc<dyn ExecutionPlan>> {
162
- Vec::new()
163
- }
164
-
165
- fn with_new_children(
166
- self: Arc<Self>,
167
- children: Vec<Arc<dyn ExecutionPlan>>,
168
- ) -> Result<Arc<dyn ExecutionPlan>> {
169
- if !children.is_empty() {
170
- return Err(DataFusionError::Execution(
171
- "LixChangeScanExec does not accept children".to_string(),
172
- ));
173
- }
174
- Ok(self)
175
- }
176
-
177
- fn execute(
178
- &self,
179
- partition: usize,
180
- _context: Arc<TaskContext>,
181
- ) -> Result<SendableRecordBatchStream> {
182
- if partition != 0 {
183
- return Err(DataFusionError::Execution(format!(
184
- "LixChangeScanExec only exposes one partition, got {partition}"
185
- )));
186
- }
187
-
188
- let query_source = self.query_source.clone();
189
- let projection = change_projection_for_scan(self.projection.as_ref());
190
- let limit = self.limit;
191
- let schema = Arc::clone(&self.schema);
192
- let stream = stream::once(async move {
193
- let mut json_reader = query_source.json_reader;
194
- let canonical_changes = query_source
195
- .commit_store_reader
196
- .scan_changes(&ChangeScanRequest { limit })
197
- .await
198
- .map_err(lix_error_to_datafusion_error)?;
199
- let mut changes = Vec::with_capacity(canonical_changes.len());
200
- for change in canonical_changes {
201
- changes.push(
202
- materialize_change(&mut json_reader, change)
203
- .await
204
- .map_err(lix_error_to_datafusion_error)?,
205
- );
206
- }
207
- change_record_batch(&projection, &changes)
208
- });
209
- Ok(Box::pin(RecordBatchStreamAdapter::new(schema, stream)))
210
- }
211
- }
212
-
213
- #[derive(Debug, Clone, Copy)]
214
- enum ChangeColumn {
215
- Id,
216
- EntityId,
217
- SchemaKey,
218
- FileId,
219
- Metadata,
220
- CreatedAt,
221
- SnapshotContent,
222
- }
223
-
224
- fn lix_change_schema() -> SchemaRef {
225
- Arc::new(Schema::new(vec![
226
- Field::new("id", DataType::Utf8, false),
227
- json_field("entity_id", false),
228
- Field::new("schema_key", DataType::Utf8, false),
229
- Field::new("file_id", DataType::Utf8, true),
230
- json_field("metadata", true),
231
- Field::new("created_at", DataType::Utf8, false),
232
- json_field("snapshot_content", true),
233
- ]))
234
- }
235
-
236
- fn change_projection_for_scan(projection: Option<&Vec<usize>>) -> Vec<ChangeColumn> {
237
- let all_columns = vec![
238
- ChangeColumn::Id,
239
- ChangeColumn::EntityId,
240
- ChangeColumn::SchemaKey,
241
- ChangeColumn::FileId,
242
- ChangeColumn::Metadata,
243
- ChangeColumn::CreatedAt,
244
- ChangeColumn::SnapshotContent,
245
- ];
246
- projection.map_or(all_columns.clone(), |indices| {
247
- indices
248
- .iter()
249
- .filter_map(|index| all_columns.get(*index).copied())
250
- .collect()
251
- })
252
- }
253
-
254
- fn projected_schema(schema: &SchemaRef, projection: Option<&Vec<usize>>) -> SchemaRef {
255
- match projection {
256
- Some(projection) => Arc::new(schema.project(projection).expect("projection is valid")),
257
- None => Arc::clone(schema),
258
- }
259
- }
260
-
261
- fn change_record_batch(
262
- projection: &[ChangeColumn],
263
- changes: &[MaterializedChange],
264
- ) -> Result<RecordBatch> {
265
- let arrays = projection
266
- .iter()
267
- .map(|column| match column {
268
- ChangeColumn::Id => string_array(changes.iter().map(|row| Some(row.id.as_str()))),
269
- ChangeColumn::EntityId => Arc::new(StringArray::from(
270
- changes
271
- .iter()
272
- .map(|row| {
273
- Some(
274
- row.entity_id
275
- .as_json_array_text()
276
- .expect("canonical change entity identity should project"),
277
- )
278
- })
279
- .collect::<Vec<_>>(),
280
- )) as ArrayRef,
281
- ChangeColumn::SchemaKey => {
282
- string_array(changes.iter().map(|row| Some(row.schema_key.as_str())))
283
- }
284
- ChangeColumn::FileId => string_array(changes.iter().map(|row| row.file_id.as_deref())),
285
- ChangeColumn::Metadata => Arc::new(StringArray::from(
286
- changes
287
- .iter()
288
- .map(|row| row.metadata.as_ref().map(serialize_row_metadata))
289
- .collect::<Vec<_>>(),
290
- )),
291
- ChangeColumn::CreatedAt => {
292
- string_array(changes.iter().map(|row| Some(row.created_at.as_str())))
293
- }
294
- ChangeColumn::SnapshotContent => {
295
- string_array(changes.iter().map(|row| row.snapshot_content.as_deref()))
296
- }
297
- })
298
- .collect::<Vec<_>>();
299
- record_batch_with_row_count(change_schema(projection), arrays, changes.len()).map_err(|error| {
300
- DataFusionError::Execution(format!("failed to build lix_change batch: {error}"))
301
- })
302
- }
303
-
304
- fn change_schema(projection: &[ChangeColumn]) -> SchemaRef {
305
- Arc::new(Schema::new(
306
- projection
307
- .iter()
308
- .map(|column| match column {
309
- ChangeColumn::Id => Field::new("id", DataType::Utf8, false),
310
- ChangeColumn::EntityId => json_field("entity_id", false),
311
- ChangeColumn::SchemaKey => Field::new("schema_key", DataType::Utf8, false),
312
- ChangeColumn::FileId => Field::new("file_id", DataType::Utf8, true),
313
- ChangeColumn::Metadata => json_field("metadata", true),
314
- ChangeColumn::CreatedAt => Field::new("created_at", DataType::Utf8, false),
315
- ChangeColumn::SnapshotContent => json_field("snapshot_content", true),
316
- })
317
- .collect::<Vec<_>>(),
318
- ))
319
- }
320
-
321
- fn string_array<'a>(values: impl Iterator<Item = Option<&'a str>>) -> ArrayRef {
322
- Arc::new(StringArray::from(values.collect::<Vec<_>>())) as ArrayRef
323
- }
324
-
325
- fn datafusion_error_to_lix_error(error: DataFusionError) -> LixError {
326
- super::error::datafusion_error_to_lix_error(error)
327
- }
328
-
329
- fn lix_error_to_datafusion_error(error: LixError) -> DataFusionError {
330
- super::error::lix_error_to_datafusion_error(error)
331
- }
@@ -1,174 +0,0 @@
1
- use datafusion::sql::parser::Statement as DataFusionStatement;
2
- use datafusion::sql::sqlparser::ast::{
3
- FromTable, ObjectName, Query, SetExpr, Statement as SqlStatement, TableFactor, TableObject,
4
- TableWithJoins,
5
- };
6
-
7
- use crate::LixError;
8
-
9
/// Coarse classification of a parsed SQL statement.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub(crate) enum SqlStatementKind {
    /// Queries and `EXPLAIN` statements.
    Read,
    /// `INSERT`, `UPDATE`, and `DELETE` statements.
    Write,
    /// Any statement that is neither a read nor a write.
    Other,
}
15
-
16
- pub(crate) fn validate_supported_datafusion_statement_ast(
17
- statement: &DataFusionStatement,
18
- ) -> Result<(), LixError> {
19
- match statement {
20
- DataFusionStatement::Statement(statement) => validate_supported_ast_statement(statement),
21
- DataFusionStatement::Explain(explain) => {
22
- if classify_datafusion_statement(explain.statement.as_ref()) == SqlStatementKind::Write
23
- {
24
- return Err(unsupported_sql_error(
25
- "EXPLAIN of write statements is not supported by Lix SQL",
26
- ));
27
- }
28
- validate_supported_datafusion_statement_ast(explain.statement.as_ref())
29
- }
30
- _ => Err(unsupported_sql_error(format!(
31
- "SQL statement is not supported by Lix SQL: {statement}"
32
- ))),
33
- }
34
- }
35
-
36
- pub(crate) fn classify_datafusion_statement(statement: &DataFusionStatement) -> SqlStatementKind {
37
- match statement {
38
- DataFusionStatement::Statement(statement) => classify_ast_statement(statement),
39
- DataFusionStatement::Explain(_) => SqlStatementKind::Read,
40
- _ => SqlStatementKind::Other,
41
- }
42
- }
43
-
44
- pub(crate) fn datafusion_statement_dml_target_table_names(
45
- statement: &DataFusionStatement,
46
- ) -> Vec<String> {
47
- let mut targets = Vec::new();
48
- collect_datafusion_statement_dml_target_table_names(statement, &mut targets);
49
- targets
50
- }
51
-
52
- fn collect_datafusion_statement_dml_target_table_names(
53
- statement: &DataFusionStatement,
54
- targets: &mut Vec<String>,
55
- ) {
56
- match statement {
57
- DataFusionStatement::Statement(statement) => {
58
- collect_dml_target_table_names(statement, targets);
59
- }
60
- DataFusionStatement::Explain(explain) => {
61
- collect_datafusion_statement_dml_target_table_names(
62
- explain.statement.as_ref(),
63
- targets,
64
- );
65
- }
66
- _ => {}
67
- }
68
- }
69
-
70
- fn collect_dml_target_table_names(statement: &SqlStatement, targets: &mut Vec<String>) {
71
- match statement {
72
- SqlStatement::Insert(insert) => {
73
- if let TableObject::TableName(name) = &insert.table {
74
- if let Some(table_name) = object_name_table_part(name) {
75
- targets.push(table_name);
76
- }
77
- }
78
- }
79
- SqlStatement::Update(update) => {
80
- collect_table_with_joins_target(&update.table, targets);
81
- }
82
- SqlStatement::Delete(delete) => {
83
- let tables = match &delete.from {
84
- FromTable::WithFromKeyword(tables) | FromTable::WithoutKeyword(tables) => tables,
85
- };
86
- for table in tables {
87
- collect_table_with_joins_target(table, targets);
88
- }
89
- }
90
- SqlStatement::Explain { statement, .. } => {
91
- collect_dml_target_table_names(statement.as_ref(), targets);
92
- }
93
- _ => {}
94
- }
95
- }
96
-
97
- fn collect_table_with_joins_target(table: &TableWithJoins, targets: &mut Vec<String>) {
98
- if let TableFactor::Table { name, .. } = &table.relation {
99
- if let Some(table_name) = object_name_table_part(name) {
100
- targets.push(table_name);
101
- }
102
- }
103
- }
104
-
105
- fn object_name_table_part(name: &ObjectName) -> Option<String> {
106
- name.0.last().and_then(|part| part.as_ident()).map(|ident| {
107
- if ident.quote_style.is_some() {
108
- ident.value.clone()
109
- } else {
110
- ident.value.to_ascii_lowercase()
111
- }
112
- })
113
- }
114
-
115
- fn classify_ast_statement(statement: &SqlStatement) -> SqlStatementKind {
116
- match statement {
117
- SqlStatement::Insert(_) | SqlStatement::Update(_) | SqlStatement::Delete(_) => {
118
- SqlStatementKind::Write
119
- }
120
- SqlStatement::Query(_) => SqlStatementKind::Read,
121
- SqlStatement::Explain { .. } => SqlStatementKind::Read,
122
- _ => SqlStatementKind::Other,
123
- }
124
- }
125
-
126
- fn validate_supported_ast_statement(statement: &SqlStatement) -> Result<(), LixError> {
127
- match statement {
128
- SqlStatement::Query(query) => validate_supported_query(query),
129
- SqlStatement::Insert(_) | SqlStatement::Update(_) | SqlStatement::Delete(_) => Ok(()),
130
- SqlStatement::Explain { statement, .. } => {
131
- if classify_ast_statement(statement.as_ref()) == SqlStatementKind::Write {
132
- return Err(unsupported_sql_error(
133
- "EXPLAIN of write statements is not supported by Lix SQL",
134
- ));
135
- }
136
- validate_supported_ast_statement(statement)
137
- }
138
- _ => Err(unsupported_sql_error(format!(
139
- "SQL statement is not supported by Lix SQL: {statement}"
140
- ))),
141
- }
142
- }
143
-
144
- fn validate_supported_query(query: &Query) -> Result<(), LixError> {
145
- if query.with.as_ref().is_some_and(|with| with.recursive) {
146
- return Err(
147
- unsupported_sql_error("recursive CTEs are not supported by Lix SQL").with_hint(
148
- "Use explicit commit graph surfaces such as lix_commit, lix_commit_edge, and lix_state_history instead of WITH RECURSIVE.",
149
- ),
150
- );
151
- }
152
-
153
- if let Some(with) = &query.with {
154
- for cte in &with.cte_tables {
155
- validate_supported_query(&cte.query)?;
156
- }
157
- }
158
- validate_supported_set_expr(&query.body)
159
- }
160
-
161
- fn validate_supported_set_expr(expr: &SetExpr) -> Result<(), LixError> {
162
- match expr {
163
- SetExpr::Query(query) => validate_supported_query(query),
164
- SetExpr::SetOperation { left, right, .. } => {
165
- validate_supported_set_expr(left)?;
166
- validate_supported_set_expr(right)
167
- }
168
- _ => Ok(()),
169
- }
170
- }
171
-
172
- fn unsupported_sql_error(message: impl Into<String>) -> LixError {
173
- LixError::new(LixError::CODE_UNSUPPORTED_SQL, message)
174
- }