@lix-js/sdk 0.6.0-preview.5 → 0.6.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (274) hide show
  1. package/README.md +76 -4
  2. package/dist/errors.d.ts +7 -0
  3. package/dist/errors.js +19 -0
  4. package/dist/index.d.ts +4 -5
  5. package/dist/index.js +3 -3
  6. package/dist/native.d.ts +1 -0
  7. package/dist/native.js +47 -0
  8. package/dist/open-lix.d.ts +38 -207
  9. package/dist/open-lix.js +59 -284
  10. package/dist/result.d.ts +18 -0
  11. package/dist/result.js +48 -0
  12. package/dist/types.d.ts +114 -1
  13. package/dist/value.d.ts +28 -0
  14. package/dist/value.js +245 -0
  15. package/package.json +38 -71
  16. package/SKILL.md +0 -507
  17. package/dist/builtin-schemas.d.ts +0 -1
  18. package/dist/builtin-schemas.js +0 -1
  19. package/dist/engine-wasm/index.d.ts +0 -87
  20. package/dist/engine-wasm/index.js +0 -339
  21. package/dist/engine-wasm/wasm/lix_engine.d.ts +0 -79
  22. package/dist/engine-wasm/wasm/lix_engine.js +0 -833
  23. package/dist/engine-wasm/wasm/lix_engine.wasm +0 -0
  24. package/dist/engine-wasm/wasm/lix_engine.wasm.d.ts +0 -27
  25. package/dist/generated/builtin-schemas.d.ts +0 -427
  26. package/dist/generated/builtin-schemas.js +0 -643
  27. package/dist/sqlite/index.d.ts +0 -12
  28. package/dist/sqlite/index.js +0 -359
  29. package/dist-engine-src/README.md +0 -18
  30. package/dist-engine-src/src/backend/capabilities.rs +0 -67
  31. package/dist-engine-src/src/backend/conformance/baseline.rs +0 -1127
  32. package/dist-engine-src/src/backend/conformance/factory.rs +0 -93
  33. package/dist-engine-src/src/backend/conformance/failure_tests.rs +0 -608
  34. package/dist-engine-src/src/backend/conformance/fixtures.rs +0 -26
  35. package/dist-engine-src/src/backend/conformance/mod.rs +0 -75
  36. package/dist-engine-src/src/backend/conformance/model.rs +0 -28
  37. package/dist-engine-src/src/backend/conformance/model_based.rs +0 -257
  38. package/dist-engine-src/src/backend/conformance/persistence.rs +0 -204
  39. package/dist-engine-src/src/backend/conformance/projection.rs +0 -21
  40. package/dist-engine-src/src/backend/conformance/pushdown.rs +0 -24
  41. package/dist-engine-src/src/backend/conformance/runner.rs +0 -90
  42. package/dist-engine-src/src/backend/conformance/scan.rs +0 -24
  43. package/dist-engine-src/src/backend/conformance/write.rs +0 -16
  44. package/dist-engine-src/src/backend/error.rs +0 -94
  45. package/dist-engine-src/src/backend/in_memory.rs +0 -670
  46. package/dist-engine-src/src/backend/mod.rs +0 -39
  47. package/dist-engine-src/src/backend/predicate.rs +0 -80
  48. package/dist-engine-src/src/backend/traits.rs +0 -260
  49. package/dist-engine-src/src/backend/types.rs +0 -239
  50. package/dist-engine-src/src/binary_cas/chunking.rs +0 -31
  51. package/dist-engine-src/src/binary_cas/codec.rs +0 -346
  52. package/dist-engine-src/src/binary_cas/context.rs +0 -139
  53. package/dist-engine-src/src/binary_cas/kv.rs +0 -1038
  54. package/dist-engine-src/src/binary_cas/mod.rs +0 -11
  55. package/dist-engine-src/src/binary_cas/types.rs +0 -121
  56. package/dist-engine-src/src/branch/context.rs +0 -40
  57. package/dist-engine-src/src/branch/lifecycle.rs +0 -221
  58. package/dist-engine-src/src/branch/mod.rs +0 -13
  59. package/dist-engine-src/src/branch/refs.rs +0 -321
  60. package/dist-engine-src/src/branch/stage_rows.rs +0 -67
  61. package/dist-engine-src/src/branch/types.rs +0 -21
  62. package/dist-engine-src/src/catalog/context.rs +0 -412
  63. package/dist-engine-src/src/catalog/mod.rs +0 -10
  64. package/dist-engine-src/src/catalog/schema.rs +0 -4
  65. package/dist-engine-src/src/catalog/snapshot.rs +0 -1114
  66. package/dist-engine-src/src/cel/context.rs +0 -86
  67. package/dist-engine-src/src/cel/error.rs +0 -19
  68. package/dist-engine-src/src/cel/mod.rs +0 -8
  69. package/dist-engine-src/src/cel/provider.rs +0 -9
  70. package/dist-engine-src/src/cel/runtime.rs +0 -167
  71. package/dist-engine-src/src/cel/value.rs +0 -50
  72. package/dist-engine-src/src/changelog/bench_support.rs +0 -785
  73. package/dist-engine-src/src/changelog/change.rs +0 -1
  74. package/dist-engine-src/src/changelog/codec.rs +0 -497
  75. package/dist-engine-src/src/changelog/commit.rs +0 -1
  76. package/dist-engine-src/src/changelog/context.rs +0 -1614
  77. package/dist-engine-src/src/changelog/mod.rs +0 -29
  78. package/dist-engine-src/src/changelog/store.rs +0 -163
  79. package/dist-engine-src/src/changelog/test_support.rs +0 -54
  80. package/dist-engine-src/src/changelog/types.rs +0 -213
  81. package/dist-engine-src/src/commit_graph/context.rs +0 -944
  82. package/dist-engine-src/src/commit_graph/mod.rs +0 -9
  83. package/dist-engine-src/src/commit_graph/types.rs +0 -89
  84. package/dist-engine-src/src/commit_graph/walker.rs +0 -786
  85. package/dist-engine-src/src/common/error.rs +0 -347
  86. package/dist-engine-src/src/common/fingerprint.rs +0 -3
  87. package/dist-engine-src/src/common/fs_path.rs +0 -1336
  88. package/dist-engine-src/src/common/identity.rs +0 -145
  89. package/dist-engine-src/src/common/json_pointer.rs +0 -67
  90. package/dist-engine-src/src/common/metadata.rs +0 -40
  91. package/dist-engine-src/src/common/mod.rs +0 -23
  92. package/dist-engine-src/src/common/types.rs +0 -105
  93. package/dist-engine-src/src/common/wire.rs +0 -222
  94. package/dist-engine-src/src/domain.rs +0 -320
  95. package/dist-engine-src/src/engine.rs +0 -203
  96. package/dist-engine-src/src/entity_pk.rs +0 -402
  97. package/dist-engine-src/src/functions/context.rs +0 -296
  98. package/dist-engine-src/src/functions/deterministic.rs +0 -113
  99. package/dist-engine-src/src/functions/mod.rs +0 -18
  100. package/dist-engine-src/src/functions/provider.rs +0 -130
  101. package/dist-engine-src/src/functions/state.rs +0 -335
  102. package/dist-engine-src/src/functions/types.rs +0 -37
  103. package/dist-engine-src/src/init.rs +0 -692
  104. package/dist-engine-src/src/json_store/compression.rs +0 -77
  105. package/dist-engine-src/src/json_store/context.rs +0 -172
  106. package/dist-engine-src/src/json_store/encoded.rs +0 -15
  107. package/dist-engine-src/src/json_store/mod.rs +0 -38
  108. package/dist-engine-src/src/json_store/store.rs +0 -494
  109. package/dist-engine-src/src/json_store/types.rs +0 -212
  110. package/dist-engine-src/src/lib.rs +0 -92
  111. package/dist-engine-src/src/live_state/context.rs +0 -1883
  112. package/dist-engine-src/src/live_state/mod.rs +0 -21
  113. package/dist-engine-src/src/live_state/overlay.rs +0 -75
  114. package/dist-engine-src/src/live_state/reader.rs +0 -23
  115. package/dist-engine-src/src/live_state/types.rs +0 -231
  116. package/dist-engine-src/src/live_state/visibility.rs +0 -666
  117. package/dist-engine-src/src/plugin/archive.rs +0 -438
  118. package/dist-engine-src/src/plugin/component.rs +0 -183
  119. package/dist-engine-src/src/plugin/install.rs +0 -619
  120. package/dist-engine-src/src/plugin/manifest.rs +0 -516
  121. package/dist-engine-src/src/plugin/materializer.rs +0 -202
  122. package/dist-engine-src/src/plugin/mod.rs +0 -33
  123. package/dist-engine-src/src/plugin/plugin_manifest.json +0 -119
  124. package/dist-engine-src/src/plugin/storage.rs +0 -74
  125. package/dist-engine-src/src/schema/annotations/defaults.rs +0 -275
  126. package/dist-engine-src/src/schema/annotations/mod.rs +0 -1
  127. package/dist-engine-src/src/schema/builtin/lix_account.json +0 -21
  128. package/dist-engine-src/src/schema/builtin/lix_active_account.json +0 -29
  129. package/dist-engine-src/src/schema/builtin/lix_binary_blob_ref.json +0 -29
  130. package/dist-engine-src/src/schema/builtin/lix_branch_descriptor.json +0 -34
  131. package/dist-engine-src/src/schema/builtin/lix_branch_ref.json +0 -48
  132. package/dist-engine-src/src/schema/builtin/lix_change.json +0 -63
  133. package/dist-engine-src/src/schema/builtin/lix_change_author.json +0 -45
  134. package/dist-engine-src/src/schema/builtin/lix_commit.json +0 -24
  135. package/dist-engine-src/src/schema/builtin/lix_commit_edge.json +0 -53
  136. package/dist-engine-src/src/schema/builtin/lix_directory_descriptor.json +0 -52
  137. package/dist-engine-src/src/schema/builtin/lix_file_descriptor.json +0 -52
  138. package/dist-engine-src/src/schema/builtin/lix_key_value.json +0 -40
  139. package/dist-engine-src/src/schema/builtin/lix_label.json +0 -29
  140. package/dist-engine-src/src/schema/builtin/lix_label_assignment.json +0 -74
  141. package/dist-engine-src/src/schema/builtin/lix_registered_schema.json +0 -25
  142. package/dist-engine-src/src/schema/builtin/mod.rs +0 -220
  143. package/dist-engine-src/src/schema/compatibility.rs +0 -787
  144. package/dist-engine-src/src/schema/definition.json +0 -187
  145. package/dist-engine-src/src/schema/definition.rs +0 -742
  146. package/dist-engine-src/src/schema/key.rs +0 -138
  147. package/dist-engine-src/src/schema/mod.rs +0 -20
  148. package/dist-engine-src/src/schema/seed.rs +0 -14
  149. package/dist-engine-src/src/schema/tests.rs +0 -780
  150. package/dist-engine-src/src/session/context.rs +0 -1059
  151. package/dist-engine-src/src/session/create_branch.rs +0 -94
  152. package/dist-engine-src/src/session/execute.rs +0 -681
  153. package/dist-engine-src/src/session/merge/analysis.rs +0 -108
  154. package/dist-engine-src/src/session/merge/branch.rs +0 -417
  155. package/dist-engine-src/src/session/merge/conflicts.rs +0 -63
  156. package/dist-engine-src/src/session/merge/mod.rs +0 -10
  157. package/dist-engine-src/src/session/merge/stats.rs +0 -61
  158. package/dist-engine-src/src/session/mod.rs +0 -30
  159. package/dist-engine-src/src/session/switch_branch.rs +0 -113
  160. package/dist-engine-src/src/session/transaction.rs +0 -557
  161. package/dist-engine-src/src/sql2/bind/classify.rs +0 -102
  162. package/dist-engine-src/src/sql2/bind/error.rs +0 -5
  163. package/dist-engine-src/src/sql2/bind/expr.rs +0 -29
  164. package/dist-engine-src/src/sql2/bind/mod.rs +0 -12
  165. package/dist-engine-src/src/sql2/bind/public_udf.rs +0 -306
  166. package/dist-engine-src/src/sql2/bind/read.rs +0 -65
  167. package/dist-engine-src/src/sql2/bind/statement.rs +0 -2236
  168. package/dist-engine-src/src/sql2/bind/table.rs +0 -273
  169. package/dist-engine-src/src/sql2/bind/write.rs +0 -86
  170. package/dist-engine-src/src/sql2/branch_scope.rs +0 -436
  171. package/dist-engine-src/src/sql2/catalog/capability.rs +0 -20
  172. package/dist-engine-src/src/sql2/catalog/entity_surface.rs +0 -296
  173. package/dist-engine-src/src/sql2/catalog/mod.rs +0 -15
  174. package/dist-engine-src/src/sql2/catalog/registry.rs +0 -556
  175. package/dist-engine-src/src/sql2/catalog/schema.rs +0 -88
  176. package/dist-engine-src/src/sql2/catalog/surface.rs +0 -41
  177. package/dist-engine-src/src/sql2/change_materialization.rs +0 -122
  178. package/dist-engine-src/src/sql2/context.rs +0 -317
  179. package/dist-engine-src/src/sql2/dml.rs +0 -148
  180. package/dist-engine-src/src/sql2/error.rs +0 -215
  181. package/dist-engine-src/src/sql2/exec/bound_public_write.rs +0 -1593
  182. package/dist-engine-src/src/sql2/exec/datafusion.rs +0 -5266
  183. package/dist-engine-src/src/sql2/exec/fast_write.rs +0 -82
  184. package/dist-engine-src/src/sql2/exec/mod.rs +0 -24
  185. package/dist-engine-src/src/sql2/exec/write.rs +0 -661
  186. package/dist-engine-src/src/sql2/filesystem_planner.rs +0 -1485
  187. package/dist-engine-src/src/sql2/filesystem_predicates.rs +0 -159
  188. package/dist-engine-src/src/sql2/filesystem_visibility.rs +0 -383
  189. package/dist-engine-src/src/sql2/history_projection.rs +0 -56
  190. package/dist-engine-src/src/sql2/history_route.rs +0 -661
  191. package/dist-engine-src/src/sql2/mod.rs +0 -52
  192. package/dist-engine-src/src/sql2/optimize/datafusion.rs +0 -1
  193. package/dist-engine-src/src/sql2/optimize/mod.rs +0 -2
  194. package/dist-engine-src/src/sql2/optimize/simple_write.rs +0 -116
  195. package/dist-engine-src/src/sql2/parse/mod.rs +0 -69
  196. package/dist-engine-src/src/sql2/parse/normalize.rs +0 -1
  197. package/dist-engine-src/src/sql2/plan/branch_scope.rs +0 -24
  198. package/dist-engine-src/src/sql2/plan/mod.rs +0 -5
  199. package/dist-engine-src/src/sql2/plan/predicate.rs +0 -22
  200. package/dist-engine-src/src/sql2/plan/write.rs +0 -147
  201. package/dist-engine-src/src/sql2/predicate_typecheck.rs +0 -504
  202. package/dist-engine-src/src/sql2/providers/branch.rs +0 -1206
  203. package/dist-engine-src/src/sql2/providers/change.rs +0 -445
  204. package/dist-engine-src/src/sql2/providers/directory.rs +0 -2422
  205. package/dist-engine-src/src/sql2/providers/directory_history.rs +0 -645
  206. package/dist-engine-src/src/sql2/providers/entity.rs +0 -1484
  207. package/dist-engine-src/src/sql2/providers/entity_history.rs +0 -452
  208. package/dist-engine-src/src/sql2/providers/file.rs +0 -3686
  209. package/dist-engine-src/src/sql2/providers/file_history.rs +0 -924
  210. package/dist-engine-src/src/sql2/providers/history.rs +0 -426
  211. package/dist-engine-src/src/sql2/providers/lix_state.rs +0 -2542
  212. package/dist-engine-src/src/sql2/providers/mod.rs +0 -508
  213. package/dist-engine-src/src/sql2/read_only.rs +0 -63
  214. package/dist-engine-src/src/sql2/record_batch.rs +0 -17
  215. package/dist-engine-src/src/sql2/result_metadata.rs +0 -29
  216. package/dist-engine-src/src/sql2/runtime.rs +0 -60
  217. package/dist-engine-src/src/sql2/session.rs +0 -83
  218. package/dist-engine-src/src/sql2/storage/constraints.rs +0 -1
  219. package/dist-engine-src/src/sql2/storage/mod.rs +0 -1
  220. package/dist-engine-src/src/sql2/test_support/differential.rs +0 -712
  221. package/dist-engine-src/src/sql2/test_support/generators.rs +0 -354
  222. package/dist-engine-src/src/sql2/test_support/mod.rs +0 -2
  223. package/dist-engine-src/src/sql2/udfs/common.rs +0 -295
  224. package/dist-engine-src/src/sql2/udfs/lix_active_branch_commit_id.rs +0 -53
  225. package/dist-engine-src/src/sql2/udfs/lix_empty_blob.rs +0 -47
  226. package/dist-engine-src/src/sql2/udfs/lix_json.rs +0 -100
  227. package/dist-engine-src/src/sql2/udfs/lix_json_get.rs +0 -99
  228. package/dist-engine-src/src/sql2/udfs/lix_json_get_text.rs +0 -99
  229. package/dist-engine-src/src/sql2/udfs/lix_text_decode.rs +0 -82
  230. package/dist-engine-src/src/sql2/udfs/lix_text_encode.rs +0 -85
  231. package/dist-engine-src/src/sql2/udfs/lix_timestamp.rs +0 -76
  232. package/dist-engine-src/src/sql2/udfs/lix_uuid_v7.rs +0 -76
  233. package/dist-engine-src/src/sql2/udfs/mod.rs +0 -86
  234. package/dist-engine-src/src/sql2/write_normalization.rs +0 -368
  235. package/dist-engine-src/src/storage/conformance.rs +0 -399
  236. package/dist-engine-src/src/storage/context.rs +0 -620
  237. package/dist-engine-src/src/storage/mod.rs +0 -52
  238. package/dist-engine-src/src/storage/point.rs +0 -440
  239. package/dist-engine-src/src/storage/read_scope.rs +0 -67
  240. package/dist-engine-src/src/storage/reader.rs +0 -867
  241. package/dist-engine-src/src/storage/scan.rs +0 -784
  242. package/dist-engine-src/src/storage/spaces.rs +0 -236
  243. package/dist-engine-src/src/storage/stats.rs +0 -80
  244. package/dist-engine-src/src/storage/write_set.rs +0 -962
  245. package/dist-engine-src/src/storage_bench.rs +0 -171
  246. package/dist-engine-src/src/test_support.rs +0 -450
  247. package/dist-engine-src/src/tracked_state/bench_support.rs +0 -394
  248. package/dist-engine-src/src/tracked_state/codec.rs +0 -1183
  249. package/dist-engine-src/src/tracked_state/commit_root_rebuild.rs +0 -358
  250. package/dist-engine-src/src/tracked_state/context.rs +0 -2801
  251. package/dist-engine-src/src/tracked_state/diff.rs +0 -2140
  252. package/dist-engine-src/src/tracked_state/merge.rs +0 -478
  253. package/dist-engine-src/src/tracked_state/mod.rs +0 -35
  254. package/dist-engine-src/src/tracked_state/row_materialization.rs +0 -275
  255. package/dist-engine-src/src/tracked_state/storage.rs +0 -427
  256. package/dist-engine-src/src/tracked_state/tree.rs +0 -3063
  257. package/dist-engine-src/src/tracked_state/types.rs +0 -238
  258. package/dist-engine-src/src/transaction/bench_support.rs +0 -407
  259. package/dist-engine-src/src/transaction/commit.rs +0 -1592
  260. package/dist-engine-src/src/transaction/context.rs +0 -1653
  261. package/dist-engine-src/src/transaction/mod.rs +0 -24
  262. package/dist-engine-src/src/transaction/normalization.rs +0 -877
  263. package/dist-engine-src/src/transaction/prep.rs +0 -37
  264. package/dist-engine-src/src/transaction/schema_resolver.rs +0 -163
  265. package/dist-engine-src/src/transaction/staging.rs +0 -1525
  266. package/dist-engine-src/src/transaction/types.rs +0 -403
  267. package/dist-engine-src/src/transaction/validation.rs +0 -5766
  268. package/dist-engine-src/src/untracked_state/codec.rs +0 -615
  269. package/dist-engine-src/src/untracked_state/context.rs +0 -98
  270. package/dist-engine-src/src/untracked_state/materialization.rs +0 -63
  271. package/dist-engine-src/src/untracked_state/mod.rs +0 -15
  272. package/dist-engine-src/src/untracked_state/storage.rs +0 -898
  273. package/dist-engine-src/src/untracked_state/types.rs +0 -146
  274. package/dist-engine-src/src/wasm/mod.rs +0 -60
@@ -1,445 +0,0 @@
1
- use std::any::Any;
2
- use std::sync::Arc;
3
-
4
- use async_trait::async_trait;
5
- use datafusion::arrow::array::{ArrayRef, StringArray};
6
- use datafusion::arrow::datatypes::{DataType, Field, Schema, SchemaRef};
7
- use datafusion::arrow::record_batch::RecordBatch;
8
- use datafusion::catalog::{Session, TableProvider};
9
- use datafusion::common::{DataFusionError, Result};
10
- use datafusion::datasource::TableType;
11
- use datafusion::execution::TaskContext;
12
- use datafusion::logical_expr::{Expr, TableProviderFilterPushDown};
13
- use datafusion::physical_expr::EquivalenceProperties;
14
- use datafusion::physical_plan::execution_plan::{Boundedness, EmissionType, PlanProperties};
15
- use datafusion::physical_plan::stream::RecordBatchStreamAdapter;
16
- use datafusion::physical_plan::{
17
- DisplayAs, DisplayFormatType, ExecutionPlan, Partitioning, SendableRecordBatchStream,
18
- };
19
- use futures_util::stream;
20
-
21
- use crate::changelog::{
22
- ChangeRecord, ChangeScanRequest, ChangelogContext, ChangelogReader, CommitLoadEntry,
23
- CommitProjection, CommitScanRequest,
24
- };
25
- use crate::serialize_row_metadata;
26
- use crate::LixError;
27
-
28
- use crate::sql2::change_materialization::{
29
- materialize_changelog_change_record, materialize_commit_graph_change, MaterializedChange,
30
- };
31
- use crate::sql2::record_batch::record_batch_with_row_count;
32
- use crate::sql2::result_metadata::json_field;
33
- use crate::sql2::SqlChangelogQuerySource;
34
- use crate::storage::StorageRead;
35
-
36
- pub(super) async fn register_lix_change_read_provider<S>(
37
- session: &datafusion::prelude::SessionContext,
38
- surface_name: &str,
39
- query_source: SqlChangelogQuerySource<S>,
40
- ) -> Result<(), LixError>
41
- where
42
- S: StorageRead + Clone + Send + Sync + 'static,
43
- {
44
- session
45
- .register_table(surface_name, Arc::new(LixChangeProvider::new(query_source)))
46
- .map_err(datafusion_error_to_lix_error)?;
47
- Ok(())
48
- }
49
-
50
- /// SQL provider for `lix_change`.
51
- ///
52
- /// `lix_change` is the unscoped durable change surface: it scans direct
53
- /// `changelog.change` records and unions derived `lix_commit` changes from
54
- /// `changelog.commit`. It does not prove branch reachability. History
55
- /// providers are the reachability-aware SQL surfaces.
56
- struct LixChangeProvider<S> {
57
- schema: SchemaRef,
58
- query_source: SqlChangelogQuerySource<S>,
59
- }
60
-
61
- impl<S> std::fmt::Debug for LixChangeProvider<S> {
62
- fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
63
- f.debug_struct("LixChangeProvider").finish()
64
- }
65
- }
66
-
67
- impl<S> LixChangeProvider<S> {
68
- fn new(query_source: SqlChangelogQuerySource<S>) -> Self {
69
- Self {
70
- schema: lix_change_schema(),
71
- query_source,
72
- }
73
- }
74
- }
75
-
76
- #[async_trait]
77
- impl<S> TableProvider for LixChangeProvider<S>
78
- where
79
- S: StorageRead + Clone + Send + Sync + 'static,
80
- {
81
- fn as_any(&self) -> &dyn Any {
82
- self
83
- }
84
-
85
- fn schema(&self) -> SchemaRef {
86
- Arc::clone(&self.schema)
87
- }
88
-
89
- fn table_type(&self) -> TableType {
90
- TableType::Base
91
- }
92
-
93
- fn supports_filters_pushdown(
94
- &self,
95
- filters: &[&Expr],
96
- ) -> Result<Vec<TableProviderFilterPushDown>> {
97
- Ok(filters
98
- .iter()
99
- .map(|_| TableProviderFilterPushDown::Unsupported)
100
- .collect())
101
- }
102
-
103
- async fn scan(
104
- &self,
105
- _state: &dyn Session,
106
- projection: Option<&Vec<usize>>,
107
- filters: &[Expr],
108
- limit: Option<usize>,
109
- ) -> Result<Arc<dyn ExecutionPlan>> {
110
- let pushed_limit = if filters.is_empty() { limit } else { None };
111
- Ok(Arc::new(LixChangeScanExec::new(
112
- self.query_source.clone(),
113
- projected_schema(&self.schema, projection),
114
- projection.cloned(),
115
- pushed_limit,
116
- )))
117
- }
118
- }
119
-
120
- struct LixChangeScanExec<S> {
121
- query_source: SqlChangelogQuerySource<S>,
122
- schema: SchemaRef,
123
- projection: Option<Vec<usize>>,
124
- limit: Option<usize>,
125
- properties: Arc<PlanProperties>,
126
- }
127
-
128
- impl<S> std::fmt::Debug for LixChangeScanExec<S> {
129
- fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
130
- f.debug_struct("LixChangeScanExec").finish()
131
- }
132
- }
133
-
134
- impl<S> LixChangeScanExec<S> {
135
- fn new(
136
- query_source: SqlChangelogQuerySource<S>,
137
- schema: SchemaRef,
138
- projection: Option<Vec<usize>>,
139
- limit: Option<usize>,
140
- ) -> Self {
141
- let properties = PlanProperties::new(
142
- EquivalenceProperties::new(schema.clone()),
143
- Partitioning::UnknownPartitioning(1),
144
- EmissionType::Incremental,
145
- Boundedness::Bounded,
146
- );
147
- Self {
148
- query_source,
149
- schema,
150
- projection,
151
- limit,
152
- properties: Arc::new(properties),
153
- }
154
- }
155
- }
156
-
157
- impl<S> DisplayAs for LixChangeScanExec<S> {
158
- fn fmt_as(&self, t: DisplayFormatType, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
159
- match t {
160
- DisplayFormatType::Default | DisplayFormatType::Verbose => {
161
- write!(f, "LixChangeScanExec")
162
- }
163
- DisplayFormatType::TreeRender => write!(f, "LixChangeScanExec"),
164
- }
165
- }
166
- }
167
-
168
- impl<S> ExecutionPlan for LixChangeScanExec<S>
169
- where
170
- S: StorageRead + Clone + Send + Sync + 'static,
171
- {
172
- fn name(&self) -> &str {
173
- "LixChangeScanExec"
174
- }
175
-
176
- fn as_any(&self) -> &dyn Any {
177
- self
178
- }
179
-
180
- fn properties(&self) -> &Arc<PlanProperties> {
181
- &self.properties
182
- }
183
-
184
- fn children(&self) -> Vec<&Arc<dyn ExecutionPlan>> {
185
- Vec::new()
186
- }
187
-
188
- fn with_new_children(
189
- self: Arc<Self>,
190
- children: Vec<Arc<dyn ExecutionPlan>>,
191
- ) -> Result<Arc<dyn ExecutionPlan>> {
192
- if !children.is_empty() {
193
- return Err(DataFusionError::Execution(
194
- "LixChangeScanExec does not accept children".to_string(),
195
- ));
196
- }
197
- Ok(self)
198
- }
199
-
200
- fn execute(
201
- &self,
202
- partition: usize,
203
- _context: Arc<TaskContext>,
204
- ) -> Result<SendableRecordBatchStream> {
205
- if partition != 0 {
206
- return Err(DataFusionError::Execution(format!(
207
- "LixChangeScanExec only exposes one partition, got {partition}"
208
- )));
209
- }
210
-
211
- let query_source = self.query_source.clone();
212
- let projection = change_projection_for_scan(self.projection.as_ref());
213
- let limit = self.limit;
214
- let schema = Arc::clone(&self.schema);
215
- let stream = stream::once(async move {
216
- let mut json_reader = query_source.json_reader;
217
- let canonical_changes = scan_changelog_changes(query_source.store, limit)
218
- .await
219
- .map_err(lix_error_to_datafusion_error)?;
220
- let mut changes = Vec::with_capacity(canonical_changes.len());
221
- for change in canonical_changes {
222
- match change {
223
- LixChangeRow::Direct(change) => changes.push(
224
- materialize_changelog_change_record(&mut json_reader, change)
225
- .await
226
- .map_err(lix_error_to_datafusion_error)?,
227
- ),
228
- LixChangeRow::DerivedCommit(change) => changes.push(
229
- materialize_commit_graph_change(&mut json_reader, change)
230
- .await
231
- .map_err(lix_error_to_datafusion_error)?,
232
- ),
233
- }
234
- }
235
- change_record_batch(&projection, &changes)
236
- });
237
- Ok(Box::pin(RecordBatchStreamAdapter::new(schema, stream)))
238
- }
239
- }
240
-
241
- async fn scan_changelog_changes<S>(
242
- store: S,
243
- limit: Option<usize>,
244
- ) -> Result<Vec<LixChangeRow>, LixError>
245
- where
246
- S: StorageRead + Clone + Send + Sync + 'static,
247
- {
248
- let mut reader = ChangelogContext::new().reader(store);
249
- let mut changes = Vec::<LixChangeRow>::new();
250
- let mut start_after = None::<String>;
251
- loop {
252
- let scan = reader
253
- .scan_changes(ChangeScanRequest {
254
- start_after: start_after.as_deref(),
255
- limit: Some(1024),
256
- })
257
- .await?;
258
- changes.extend(scan.entries.into_iter().map(LixChangeRow::Direct));
259
- let Some(next) = scan.next_start_after else {
260
- break;
261
- };
262
- start_after = Some(next);
263
- }
264
- let mut start_after = None::<String>;
265
- loop {
266
- let scan = reader
267
- .scan_commits(CommitScanRequest {
268
- start_after: start_after.as_deref(),
269
- limit: Some(1024),
270
- projection: CommitProjection::Record,
271
- })
272
- .await?;
273
- for entry in scan.entries {
274
- let CommitLoadEntry::Record(commit) = entry else {
275
- continue;
276
- };
277
- changes.push(LixChangeRow::DerivedCommit(commit_record_canonical_change(
278
- &commit,
279
- )));
280
- }
281
- let Some(next) = scan.next_start_after else {
282
- break;
283
- };
284
- start_after = Some(next);
285
- }
286
- changes.sort_by(|left, right| left.change_id().cmp(right.change_id()));
287
- if let Some(limit) = limit {
288
- changes.truncate(limit);
289
- }
290
- Ok(changes)
291
- }
292
-
293
- enum LixChangeRow {
294
- Direct(ChangeRecord),
295
- DerivedCommit(crate::commit_graph::CommitGraphChange),
296
- }
297
-
298
- impl LixChangeRow {
299
- fn change_id(&self) -> &str {
300
- match self {
301
- Self::Direct(change) => &change.change_id,
302
- Self::DerivedCommit(change) => &change.id,
303
- }
304
- }
305
- }
306
-
307
- fn commit_record_canonical_change(
308
- commit: &crate::changelog::CommitRecord,
309
- ) -> crate::commit_graph::CommitGraphChange {
310
- let snapshot_content = serde_json::to_string(&serde_json::json!({
311
- "id": commit.commit_id,
312
- }))
313
- .expect("lix_commit snapshot serialization should not fail");
314
- crate::commit_graph::CommitGraphChange {
315
- id: commit.change_id.clone(),
316
- entity_pk: crate::entity_pk::EntityPk::single(&commit.commit_id),
317
- schema_key: "lix_commit".to_string(),
318
- file_id: None,
319
- snapshot_ref: Some(crate::json_store::JsonRef::for_content(
320
- snapshot_content.as_bytes(),
321
- )),
322
- metadata_ref: None,
323
- created_at: commit.created_at.clone(),
324
- }
325
- }
326
-
327
/// Columns of the `lix_change` surface, declared in schema order.
#[derive(Debug, Clone, Copy)]
enum ChangeColumn {
    /// `id` column.
    Id,
    /// `entity_pk` column.
    EntityPk,
    /// `schema_key` column.
    SchemaKey,
    /// `file_id` column.
    FileId,
    /// `metadata` column.
    Metadata,
    /// `created_at` column.
    CreatedAt,
    /// `snapshot_content` column.
    SnapshotContent,
}
337
-
338
- pub(super) fn lix_change_schema() -> SchemaRef {
339
- Arc::new(Schema::new(vec![
340
- Field::new("id", DataType::Utf8, false),
341
- json_field("entity_pk", false),
342
- Field::new("schema_key", DataType::Utf8, false),
343
- Field::new("file_id", DataType::Utf8, true),
344
- json_field("metadata", true),
345
- Field::new("created_at", DataType::Utf8, false),
346
- json_field("snapshot_content", true),
347
- ]))
348
- }
349
-
350
- fn change_projection_for_scan(projection: Option<&Vec<usize>>) -> Vec<ChangeColumn> {
351
- let all_columns = vec![
352
- ChangeColumn::Id,
353
- ChangeColumn::EntityPk,
354
- ChangeColumn::SchemaKey,
355
- ChangeColumn::FileId,
356
- ChangeColumn::Metadata,
357
- ChangeColumn::CreatedAt,
358
- ChangeColumn::SnapshotContent,
359
- ];
360
- projection.map_or(all_columns.clone(), |indices| {
361
- indices
362
- .iter()
363
- .filter_map(|index| all_columns.get(*index).copied())
364
- .collect()
365
- })
366
- }
367
-
368
- fn projected_schema(schema: &SchemaRef, projection: Option<&Vec<usize>>) -> SchemaRef {
369
- match projection {
370
- Some(projection) => Arc::new(schema.project(projection).expect("projection is valid")),
371
- None => Arc::clone(schema),
372
- }
373
- }
374
-
375
- fn change_record_batch(
376
- projection: &[ChangeColumn],
377
- changes: &[MaterializedChange],
378
- ) -> Result<RecordBatch> {
379
- let arrays = projection
380
- .iter()
381
- .map(|column| match column {
382
- ChangeColumn::Id => string_array(changes.iter().map(|row| Some(row.id.as_str()))),
383
- ChangeColumn::EntityPk => Arc::new(StringArray::from(
384
- changes
385
- .iter()
386
- .map(|row| {
387
- Some(
388
- row.entity_pk
389
- .as_json_array_text()
390
- .expect("canonical change entity primary key should project"),
391
- )
392
- })
393
- .collect::<Vec<_>>(),
394
- )) as ArrayRef,
395
- ChangeColumn::SchemaKey => {
396
- string_array(changes.iter().map(|row| Some(row.schema_key.as_str())))
397
- }
398
- ChangeColumn::FileId => string_array(changes.iter().map(|row| row.file_id.as_deref())),
399
- ChangeColumn::Metadata => Arc::new(StringArray::from(
400
- changes
401
- .iter()
402
- .map(|row| row.metadata.as_ref().map(serialize_row_metadata))
403
- .collect::<Vec<_>>(),
404
- )),
405
- ChangeColumn::CreatedAt => {
406
- string_array(changes.iter().map(|row| Some(row.created_at.as_str())))
407
- }
408
- ChangeColumn::SnapshotContent => {
409
- string_array(changes.iter().map(|row| row.snapshot_content.as_deref()))
410
- }
411
- })
412
- .collect::<Vec<_>>();
413
- record_batch_with_row_count(change_schema(projection), arrays, changes.len()).map_err(|error| {
414
- DataFusionError::Execution(format!("failed to build lix_change batch: {error}"))
415
- })
416
- }
417
-
418
- fn change_schema(projection: &[ChangeColumn]) -> SchemaRef {
419
- Arc::new(Schema::new(
420
- projection
421
- .iter()
422
- .map(|column| match column {
423
- ChangeColumn::Id => Field::new("id", DataType::Utf8, false),
424
- ChangeColumn::EntityPk => json_field("entity_pk", false),
425
- ChangeColumn::SchemaKey => Field::new("schema_key", DataType::Utf8, false),
426
- ChangeColumn::FileId => Field::new("file_id", DataType::Utf8, true),
427
- ChangeColumn::Metadata => json_field("metadata", true),
428
- ChangeColumn::CreatedAt => Field::new("created_at", DataType::Utf8, false),
429
- ChangeColumn::SnapshotContent => json_field("snapshot_content", true),
430
- })
431
- .collect::<Vec<_>>(),
432
- ))
433
- }
434
-
435
- fn string_array<'a>(values: impl Iterator<Item = Option<&'a str>>) -> ArrayRef {
436
- Arc::new(StringArray::from(values.collect::<Vec<_>>())) as ArrayRef
437
- }
438
-
439
- fn datafusion_error_to_lix_error(error: DataFusionError) -> LixError {
440
- crate::sql2::error::datafusion_error_to_lix_error(error)
441
- }
442
-
443
- fn lix_error_to_datafusion_error(error: LixError) -> DataFusionError {
444
- crate::sql2::error::lix_error_to_datafusion_error(error)
445
- }