@lix-js/sdk 0.6.0-preview.5 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (274) hide show
  1. package/README.md +76 -4
  2. package/dist/errors.d.ts +7 -0
  3. package/dist/errors.js +19 -0
  4. package/dist/index.d.ts +4 -5
  5. package/dist/index.js +3 -3
  6. package/dist/native.d.ts +1 -0
  7. package/dist/native.js +47 -0
  8. package/dist/open-lix.d.ts +38 -207
  9. package/dist/open-lix.js +59 -284
  10. package/dist/result.d.ts +18 -0
  11. package/dist/result.js +48 -0
  12. package/dist/types.d.ts +114 -1
  13. package/dist/value.d.ts +28 -0
  14. package/dist/value.js +245 -0
  15. package/package.json +38 -71
  16. package/SKILL.md +0 -507
  17. package/dist/builtin-schemas.d.ts +0 -1
  18. package/dist/builtin-schemas.js +0 -1
  19. package/dist/engine-wasm/index.d.ts +0 -87
  20. package/dist/engine-wasm/index.js +0 -339
  21. package/dist/engine-wasm/wasm/lix_engine.d.ts +0 -79
  22. package/dist/engine-wasm/wasm/lix_engine.js +0 -833
  23. package/dist/engine-wasm/wasm/lix_engine.wasm +0 -0
  24. package/dist/engine-wasm/wasm/lix_engine.wasm.d.ts +0 -27
  25. package/dist/generated/builtin-schemas.d.ts +0 -427
  26. package/dist/generated/builtin-schemas.js +0 -643
  27. package/dist/sqlite/index.d.ts +0 -12
  28. package/dist/sqlite/index.js +0 -359
  29. package/dist-engine-src/README.md +0 -18
  30. package/dist-engine-src/src/backend/capabilities.rs +0 -67
  31. package/dist-engine-src/src/backend/conformance/baseline.rs +0 -1127
  32. package/dist-engine-src/src/backend/conformance/factory.rs +0 -93
  33. package/dist-engine-src/src/backend/conformance/failure_tests.rs +0 -608
  34. package/dist-engine-src/src/backend/conformance/fixtures.rs +0 -26
  35. package/dist-engine-src/src/backend/conformance/mod.rs +0 -75
  36. package/dist-engine-src/src/backend/conformance/model.rs +0 -28
  37. package/dist-engine-src/src/backend/conformance/model_based.rs +0 -257
  38. package/dist-engine-src/src/backend/conformance/persistence.rs +0 -204
  39. package/dist-engine-src/src/backend/conformance/projection.rs +0 -21
  40. package/dist-engine-src/src/backend/conformance/pushdown.rs +0 -24
  41. package/dist-engine-src/src/backend/conformance/runner.rs +0 -90
  42. package/dist-engine-src/src/backend/conformance/scan.rs +0 -24
  43. package/dist-engine-src/src/backend/conformance/write.rs +0 -16
  44. package/dist-engine-src/src/backend/error.rs +0 -94
  45. package/dist-engine-src/src/backend/in_memory.rs +0 -670
  46. package/dist-engine-src/src/backend/mod.rs +0 -39
  47. package/dist-engine-src/src/backend/predicate.rs +0 -80
  48. package/dist-engine-src/src/backend/traits.rs +0 -260
  49. package/dist-engine-src/src/backend/types.rs +0 -239
  50. package/dist-engine-src/src/binary_cas/chunking.rs +0 -31
  51. package/dist-engine-src/src/binary_cas/codec.rs +0 -346
  52. package/dist-engine-src/src/binary_cas/context.rs +0 -139
  53. package/dist-engine-src/src/binary_cas/kv.rs +0 -1038
  54. package/dist-engine-src/src/binary_cas/mod.rs +0 -11
  55. package/dist-engine-src/src/binary_cas/types.rs +0 -121
  56. package/dist-engine-src/src/branch/context.rs +0 -40
  57. package/dist-engine-src/src/branch/lifecycle.rs +0 -221
  58. package/dist-engine-src/src/branch/mod.rs +0 -13
  59. package/dist-engine-src/src/branch/refs.rs +0 -321
  60. package/dist-engine-src/src/branch/stage_rows.rs +0 -67
  61. package/dist-engine-src/src/branch/types.rs +0 -21
  62. package/dist-engine-src/src/catalog/context.rs +0 -412
  63. package/dist-engine-src/src/catalog/mod.rs +0 -10
  64. package/dist-engine-src/src/catalog/schema.rs +0 -4
  65. package/dist-engine-src/src/catalog/snapshot.rs +0 -1114
  66. package/dist-engine-src/src/cel/context.rs +0 -86
  67. package/dist-engine-src/src/cel/error.rs +0 -19
  68. package/dist-engine-src/src/cel/mod.rs +0 -8
  69. package/dist-engine-src/src/cel/provider.rs +0 -9
  70. package/dist-engine-src/src/cel/runtime.rs +0 -167
  71. package/dist-engine-src/src/cel/value.rs +0 -50
  72. package/dist-engine-src/src/changelog/bench_support.rs +0 -785
  73. package/dist-engine-src/src/changelog/change.rs +0 -1
  74. package/dist-engine-src/src/changelog/codec.rs +0 -497
  75. package/dist-engine-src/src/changelog/commit.rs +0 -1
  76. package/dist-engine-src/src/changelog/context.rs +0 -1614
  77. package/dist-engine-src/src/changelog/mod.rs +0 -29
  78. package/dist-engine-src/src/changelog/store.rs +0 -163
  79. package/dist-engine-src/src/changelog/test_support.rs +0 -54
  80. package/dist-engine-src/src/changelog/types.rs +0 -213
  81. package/dist-engine-src/src/commit_graph/context.rs +0 -944
  82. package/dist-engine-src/src/commit_graph/mod.rs +0 -9
  83. package/dist-engine-src/src/commit_graph/types.rs +0 -89
  84. package/dist-engine-src/src/commit_graph/walker.rs +0 -786
  85. package/dist-engine-src/src/common/error.rs +0 -347
  86. package/dist-engine-src/src/common/fingerprint.rs +0 -3
  87. package/dist-engine-src/src/common/fs_path.rs +0 -1336
  88. package/dist-engine-src/src/common/identity.rs +0 -145
  89. package/dist-engine-src/src/common/json_pointer.rs +0 -67
  90. package/dist-engine-src/src/common/metadata.rs +0 -40
  91. package/dist-engine-src/src/common/mod.rs +0 -23
  92. package/dist-engine-src/src/common/types.rs +0 -105
  93. package/dist-engine-src/src/common/wire.rs +0 -222
  94. package/dist-engine-src/src/domain.rs +0 -320
  95. package/dist-engine-src/src/engine.rs +0 -203
  96. package/dist-engine-src/src/entity_pk.rs +0 -402
  97. package/dist-engine-src/src/functions/context.rs +0 -296
  98. package/dist-engine-src/src/functions/deterministic.rs +0 -113
  99. package/dist-engine-src/src/functions/mod.rs +0 -18
  100. package/dist-engine-src/src/functions/provider.rs +0 -130
  101. package/dist-engine-src/src/functions/state.rs +0 -335
  102. package/dist-engine-src/src/functions/types.rs +0 -37
  103. package/dist-engine-src/src/init.rs +0 -692
  104. package/dist-engine-src/src/json_store/compression.rs +0 -77
  105. package/dist-engine-src/src/json_store/context.rs +0 -172
  106. package/dist-engine-src/src/json_store/encoded.rs +0 -15
  107. package/dist-engine-src/src/json_store/mod.rs +0 -38
  108. package/dist-engine-src/src/json_store/store.rs +0 -494
  109. package/dist-engine-src/src/json_store/types.rs +0 -212
  110. package/dist-engine-src/src/lib.rs +0 -92
  111. package/dist-engine-src/src/live_state/context.rs +0 -1883
  112. package/dist-engine-src/src/live_state/mod.rs +0 -21
  113. package/dist-engine-src/src/live_state/overlay.rs +0 -75
  114. package/dist-engine-src/src/live_state/reader.rs +0 -23
  115. package/dist-engine-src/src/live_state/types.rs +0 -231
  116. package/dist-engine-src/src/live_state/visibility.rs +0 -666
  117. package/dist-engine-src/src/plugin/archive.rs +0 -438
  118. package/dist-engine-src/src/plugin/component.rs +0 -183
  119. package/dist-engine-src/src/plugin/install.rs +0 -619
  120. package/dist-engine-src/src/plugin/manifest.rs +0 -516
  121. package/dist-engine-src/src/plugin/materializer.rs +0 -202
  122. package/dist-engine-src/src/plugin/mod.rs +0 -33
  123. package/dist-engine-src/src/plugin/plugin_manifest.json +0 -119
  124. package/dist-engine-src/src/plugin/storage.rs +0 -74
  125. package/dist-engine-src/src/schema/annotations/defaults.rs +0 -275
  126. package/dist-engine-src/src/schema/annotations/mod.rs +0 -1
  127. package/dist-engine-src/src/schema/builtin/lix_account.json +0 -21
  128. package/dist-engine-src/src/schema/builtin/lix_active_account.json +0 -29
  129. package/dist-engine-src/src/schema/builtin/lix_binary_blob_ref.json +0 -29
  130. package/dist-engine-src/src/schema/builtin/lix_branch_descriptor.json +0 -34
  131. package/dist-engine-src/src/schema/builtin/lix_branch_ref.json +0 -48
  132. package/dist-engine-src/src/schema/builtin/lix_change.json +0 -63
  133. package/dist-engine-src/src/schema/builtin/lix_change_author.json +0 -45
  134. package/dist-engine-src/src/schema/builtin/lix_commit.json +0 -24
  135. package/dist-engine-src/src/schema/builtin/lix_commit_edge.json +0 -53
  136. package/dist-engine-src/src/schema/builtin/lix_directory_descriptor.json +0 -52
  137. package/dist-engine-src/src/schema/builtin/lix_file_descriptor.json +0 -52
  138. package/dist-engine-src/src/schema/builtin/lix_key_value.json +0 -40
  139. package/dist-engine-src/src/schema/builtin/lix_label.json +0 -29
  140. package/dist-engine-src/src/schema/builtin/lix_label_assignment.json +0 -74
  141. package/dist-engine-src/src/schema/builtin/lix_registered_schema.json +0 -25
  142. package/dist-engine-src/src/schema/builtin/mod.rs +0 -220
  143. package/dist-engine-src/src/schema/compatibility.rs +0 -787
  144. package/dist-engine-src/src/schema/definition.json +0 -187
  145. package/dist-engine-src/src/schema/definition.rs +0 -742
  146. package/dist-engine-src/src/schema/key.rs +0 -138
  147. package/dist-engine-src/src/schema/mod.rs +0 -20
  148. package/dist-engine-src/src/schema/seed.rs +0 -14
  149. package/dist-engine-src/src/schema/tests.rs +0 -780
  150. package/dist-engine-src/src/session/context.rs +0 -1059
  151. package/dist-engine-src/src/session/create_branch.rs +0 -94
  152. package/dist-engine-src/src/session/execute.rs +0 -681
  153. package/dist-engine-src/src/session/merge/analysis.rs +0 -108
  154. package/dist-engine-src/src/session/merge/branch.rs +0 -417
  155. package/dist-engine-src/src/session/merge/conflicts.rs +0 -63
  156. package/dist-engine-src/src/session/merge/mod.rs +0 -10
  157. package/dist-engine-src/src/session/merge/stats.rs +0 -61
  158. package/dist-engine-src/src/session/mod.rs +0 -30
  159. package/dist-engine-src/src/session/switch_branch.rs +0 -113
  160. package/dist-engine-src/src/session/transaction.rs +0 -557
  161. package/dist-engine-src/src/sql2/bind/classify.rs +0 -102
  162. package/dist-engine-src/src/sql2/bind/error.rs +0 -5
  163. package/dist-engine-src/src/sql2/bind/expr.rs +0 -29
  164. package/dist-engine-src/src/sql2/bind/mod.rs +0 -12
  165. package/dist-engine-src/src/sql2/bind/public_udf.rs +0 -306
  166. package/dist-engine-src/src/sql2/bind/read.rs +0 -65
  167. package/dist-engine-src/src/sql2/bind/statement.rs +0 -2236
  168. package/dist-engine-src/src/sql2/bind/table.rs +0 -273
  169. package/dist-engine-src/src/sql2/bind/write.rs +0 -86
  170. package/dist-engine-src/src/sql2/branch_scope.rs +0 -436
  171. package/dist-engine-src/src/sql2/catalog/capability.rs +0 -20
  172. package/dist-engine-src/src/sql2/catalog/entity_surface.rs +0 -296
  173. package/dist-engine-src/src/sql2/catalog/mod.rs +0 -15
  174. package/dist-engine-src/src/sql2/catalog/registry.rs +0 -556
  175. package/dist-engine-src/src/sql2/catalog/schema.rs +0 -88
  176. package/dist-engine-src/src/sql2/catalog/surface.rs +0 -41
  177. package/dist-engine-src/src/sql2/change_materialization.rs +0 -122
  178. package/dist-engine-src/src/sql2/context.rs +0 -317
  179. package/dist-engine-src/src/sql2/dml.rs +0 -148
  180. package/dist-engine-src/src/sql2/error.rs +0 -215
  181. package/dist-engine-src/src/sql2/exec/bound_public_write.rs +0 -1593
  182. package/dist-engine-src/src/sql2/exec/datafusion.rs +0 -5266
  183. package/dist-engine-src/src/sql2/exec/fast_write.rs +0 -82
  184. package/dist-engine-src/src/sql2/exec/mod.rs +0 -24
  185. package/dist-engine-src/src/sql2/exec/write.rs +0 -661
  186. package/dist-engine-src/src/sql2/filesystem_planner.rs +0 -1485
  187. package/dist-engine-src/src/sql2/filesystem_predicates.rs +0 -159
  188. package/dist-engine-src/src/sql2/filesystem_visibility.rs +0 -383
  189. package/dist-engine-src/src/sql2/history_projection.rs +0 -56
  190. package/dist-engine-src/src/sql2/history_route.rs +0 -661
  191. package/dist-engine-src/src/sql2/mod.rs +0 -52
  192. package/dist-engine-src/src/sql2/optimize/datafusion.rs +0 -1
  193. package/dist-engine-src/src/sql2/optimize/mod.rs +0 -2
  194. package/dist-engine-src/src/sql2/optimize/simple_write.rs +0 -116
  195. package/dist-engine-src/src/sql2/parse/mod.rs +0 -69
  196. package/dist-engine-src/src/sql2/parse/normalize.rs +0 -1
  197. package/dist-engine-src/src/sql2/plan/branch_scope.rs +0 -24
  198. package/dist-engine-src/src/sql2/plan/mod.rs +0 -5
  199. package/dist-engine-src/src/sql2/plan/predicate.rs +0 -22
  200. package/dist-engine-src/src/sql2/plan/write.rs +0 -147
  201. package/dist-engine-src/src/sql2/predicate_typecheck.rs +0 -504
  202. package/dist-engine-src/src/sql2/providers/branch.rs +0 -1206
  203. package/dist-engine-src/src/sql2/providers/change.rs +0 -445
  204. package/dist-engine-src/src/sql2/providers/directory.rs +0 -2422
  205. package/dist-engine-src/src/sql2/providers/directory_history.rs +0 -645
  206. package/dist-engine-src/src/sql2/providers/entity.rs +0 -1484
  207. package/dist-engine-src/src/sql2/providers/entity_history.rs +0 -452
  208. package/dist-engine-src/src/sql2/providers/file.rs +0 -3686
  209. package/dist-engine-src/src/sql2/providers/file_history.rs +0 -924
  210. package/dist-engine-src/src/sql2/providers/history.rs +0 -426
  211. package/dist-engine-src/src/sql2/providers/lix_state.rs +0 -2542
  212. package/dist-engine-src/src/sql2/providers/mod.rs +0 -508
  213. package/dist-engine-src/src/sql2/read_only.rs +0 -63
  214. package/dist-engine-src/src/sql2/record_batch.rs +0 -17
  215. package/dist-engine-src/src/sql2/result_metadata.rs +0 -29
  216. package/dist-engine-src/src/sql2/runtime.rs +0 -60
  217. package/dist-engine-src/src/sql2/session.rs +0 -83
  218. package/dist-engine-src/src/sql2/storage/constraints.rs +0 -1
  219. package/dist-engine-src/src/sql2/storage/mod.rs +0 -1
  220. package/dist-engine-src/src/sql2/test_support/differential.rs +0 -712
  221. package/dist-engine-src/src/sql2/test_support/generators.rs +0 -354
  222. package/dist-engine-src/src/sql2/test_support/mod.rs +0 -2
  223. package/dist-engine-src/src/sql2/udfs/common.rs +0 -295
  224. package/dist-engine-src/src/sql2/udfs/lix_active_branch_commit_id.rs +0 -53
  225. package/dist-engine-src/src/sql2/udfs/lix_empty_blob.rs +0 -47
  226. package/dist-engine-src/src/sql2/udfs/lix_json.rs +0 -100
  227. package/dist-engine-src/src/sql2/udfs/lix_json_get.rs +0 -99
  228. package/dist-engine-src/src/sql2/udfs/lix_json_get_text.rs +0 -99
  229. package/dist-engine-src/src/sql2/udfs/lix_text_decode.rs +0 -82
  230. package/dist-engine-src/src/sql2/udfs/lix_text_encode.rs +0 -85
  231. package/dist-engine-src/src/sql2/udfs/lix_timestamp.rs +0 -76
  232. package/dist-engine-src/src/sql2/udfs/lix_uuid_v7.rs +0 -76
  233. package/dist-engine-src/src/sql2/udfs/mod.rs +0 -86
  234. package/dist-engine-src/src/sql2/write_normalization.rs +0 -368
  235. package/dist-engine-src/src/storage/conformance.rs +0 -399
  236. package/dist-engine-src/src/storage/context.rs +0 -620
  237. package/dist-engine-src/src/storage/mod.rs +0 -52
  238. package/dist-engine-src/src/storage/point.rs +0 -440
  239. package/dist-engine-src/src/storage/read_scope.rs +0 -67
  240. package/dist-engine-src/src/storage/reader.rs +0 -867
  241. package/dist-engine-src/src/storage/scan.rs +0 -784
  242. package/dist-engine-src/src/storage/spaces.rs +0 -236
  243. package/dist-engine-src/src/storage/stats.rs +0 -80
  244. package/dist-engine-src/src/storage/write_set.rs +0 -962
  245. package/dist-engine-src/src/storage_bench.rs +0 -171
  246. package/dist-engine-src/src/test_support.rs +0 -450
  247. package/dist-engine-src/src/tracked_state/bench_support.rs +0 -394
  248. package/dist-engine-src/src/tracked_state/codec.rs +0 -1183
  249. package/dist-engine-src/src/tracked_state/commit_root_rebuild.rs +0 -358
  250. package/dist-engine-src/src/tracked_state/context.rs +0 -2801
  251. package/dist-engine-src/src/tracked_state/diff.rs +0 -2140
  252. package/dist-engine-src/src/tracked_state/merge.rs +0 -478
  253. package/dist-engine-src/src/tracked_state/mod.rs +0 -35
  254. package/dist-engine-src/src/tracked_state/row_materialization.rs +0 -275
  255. package/dist-engine-src/src/tracked_state/storage.rs +0 -427
  256. package/dist-engine-src/src/tracked_state/tree.rs +0 -3063
  257. package/dist-engine-src/src/tracked_state/types.rs +0 -238
  258. package/dist-engine-src/src/transaction/bench_support.rs +0 -407
  259. package/dist-engine-src/src/transaction/commit.rs +0 -1592
  260. package/dist-engine-src/src/transaction/context.rs +0 -1653
  261. package/dist-engine-src/src/transaction/mod.rs +0 -24
  262. package/dist-engine-src/src/transaction/normalization.rs +0 -877
  263. package/dist-engine-src/src/transaction/prep.rs +0 -37
  264. package/dist-engine-src/src/transaction/schema_resolver.rs +0 -163
  265. package/dist-engine-src/src/transaction/staging.rs +0 -1525
  266. package/dist-engine-src/src/transaction/types.rs +0 -403
  267. package/dist-engine-src/src/transaction/validation.rs +0 -5766
  268. package/dist-engine-src/src/untracked_state/codec.rs +0 -615
  269. package/dist-engine-src/src/untracked_state/context.rs +0 -98
  270. package/dist-engine-src/src/untracked_state/materialization.rs +0 -63
  271. package/dist-engine-src/src/untracked_state/mod.rs +0 -15
  272. package/dist-engine-src/src/untracked_state/storage.rs +0 -898
  273. package/dist-engine-src/src/untracked_state/types.rs +0 -146
  274. package/dist-engine-src/src/wasm/mod.rs +0 -60
@@ -1,645 +0,0 @@
1
- use std::any::Any;
2
- use std::collections::{BTreeMap, BTreeSet};
3
- use std::sync::Arc;
4
-
5
- use async_trait::async_trait;
6
- use datafusion::arrow::array::{ArrayRef, BooleanArray, Int64Array, StringArray};
7
- use datafusion::arrow::datatypes::{DataType, Field, Schema, SchemaRef};
8
- use datafusion::arrow::record_batch::{RecordBatch, RecordBatchOptions};
9
- use datafusion::catalog::{Session, TableProvider};
10
- use datafusion::common::{DataFusionError, Result};
11
- use datafusion::datasource::TableType;
12
- use datafusion::execution::TaskContext;
13
- use datafusion::logical_expr::{Expr, TableProviderFilterPushDown};
14
- use datafusion::physical_expr::EquivalenceProperties;
15
- use datafusion::physical_plan::execution_plan::{Boundedness, EmissionType, PlanProperties};
16
- use datafusion::physical_plan::stream::RecordBatchStreamAdapter;
17
- use datafusion::physical_plan::{
18
- DisplayAs, DisplayFormatType, ExecutionPlan, Partitioning, SendableRecordBatchStream,
19
- };
20
- use futures_util::stream;
21
- use serde::Deserialize;
22
- use tokio::sync::Mutex;
23
-
24
- use crate::commit_graph::CommitGraphReader;
25
- use crate::serialize_row_metadata;
26
- use crate::LixError;
27
-
28
- use crate::sql2::change_materialization::MaterializedChange;
29
- use crate::sql2::history_projection::{tombstone_identity_column_value, HistoryIdentityProjection};
30
- use crate::sql2::history_route::{
31
- history_descriptor_event_matches, load_history_entries, parse_history_filter,
32
- HistoryColumnStyle, HistoryEntry, HistoryRoute, HistoryViewDescriptor, HISTORY_COL_CHANGE_ID,
33
- HISTORY_COL_COMMIT_CREATED_AT, HISTORY_COL_DEPTH, HISTORY_COL_ENTITY_PK, HISTORY_COL_FILE_ID,
34
- HISTORY_COL_METADATA, HISTORY_COL_OBSERVED_COMMIT_ID, HISTORY_COL_SCHEMA_KEY,
35
- HISTORY_COL_SNAPSHOT_CONTENT, HISTORY_COL_START_COMMIT_ID,
36
- };
37
- use crate::sql2::result_metadata::json_field;
38
- use crate::sql2::SqlHistoryQuerySource;
39
- use crate::storage::StorageRead;
40
-
41
- const DIRECTORY_DESCRIPTOR_SCHEMA_KEY: &str = "lix_directory_descriptor";
42
-
43
- pub(super) async fn register_lix_directory_history_surface<S>(
44
- session: &datafusion::prelude::SessionContext,
45
- surface_name: &str,
46
- commit_graph: Box<dyn CommitGraphReader>,
47
- query_source: SqlHistoryQuerySource<S>,
48
- ) -> Result<(), LixError>
49
- where
50
- S: StorageRead + Clone + Send + Sync + 'static,
51
- {
52
- session
53
- .register_table(
54
- surface_name,
55
- Arc::new(LixDirectoryHistoryProvider::new(
56
- Arc::new(Mutex::new(commit_graph)),
57
- query_source,
58
- )),
59
- )
60
- .map_err(datafusion_error_to_lix_error)?;
61
- Ok(())
62
- }
63
-
64
- struct LixDirectoryHistoryProvider<S> {
65
- schema: SchemaRef,
66
- commit_graph: Arc<Mutex<Box<dyn CommitGraphReader>>>,
67
- query_source: SqlHistoryQuerySource<S>,
68
- }
69
-
70
- impl<S> std::fmt::Debug for LixDirectoryHistoryProvider<S> {
71
- fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
72
- f.debug_struct("LixDirectoryHistoryProvider").finish()
73
- }
74
- }
75
-
76
- impl<S> LixDirectoryHistoryProvider<S> {
77
- fn new(
78
- commit_graph: Arc<Mutex<Box<dyn CommitGraphReader>>>,
79
- query_source: SqlHistoryQuerySource<S>,
80
- ) -> Self {
81
- Self {
82
- schema: lix_directory_history_schema(),
83
- commit_graph,
84
- query_source,
85
- }
86
- }
87
- }
88
-
89
- #[async_trait]
90
- impl<S> TableProvider for LixDirectoryHistoryProvider<S>
91
- where
92
- S: StorageRead + Clone + Send + Sync + 'static,
93
- {
94
- fn as_any(&self) -> &dyn Any {
95
- self
96
- }
97
-
98
- fn schema(&self) -> SchemaRef {
99
- Arc::clone(&self.schema)
100
- }
101
-
102
- fn table_type(&self) -> TableType {
103
- TableType::View
104
- }
105
-
106
- fn supports_filters_pushdown(
107
- &self,
108
- filters: &[&Expr],
109
- ) -> Result<Vec<TableProviderFilterPushDown>> {
110
- Ok(filters
111
- .iter()
112
- .map(|filter| {
113
- if parse_history_filter(filter, HistoryColumnStyle::Prefixed).is_some() {
114
- TableProviderFilterPushDown::Exact
115
- } else {
116
- TableProviderFilterPushDown::Unsupported
117
- }
118
- })
119
- .collect())
120
- }
121
-
122
- async fn scan(
123
- &self,
124
- _state: &dyn Session,
125
- projection: Option<&Vec<usize>>,
126
- filters: &[Expr],
127
- limit: Option<usize>,
128
- ) -> Result<Arc<dyn ExecutionPlan>> {
129
- Ok(Arc::new(LixDirectoryHistoryScanExec::new(
130
- Arc::clone(&self.commit_graph),
131
- self.query_source.clone(),
132
- projected_schema(&self.schema, projection)?,
133
- HistoryRoute::from_filters(filters, HistoryColumnStyle::Prefixed),
134
- limit,
135
- )))
136
- }
137
- }
138
-
139
- struct LixDirectoryHistoryScanExec<S> {
140
- commit_graph: Arc<Mutex<Box<dyn CommitGraphReader>>>,
141
- query_source: SqlHistoryQuerySource<S>,
142
- schema: SchemaRef,
143
- route: HistoryRoute,
144
- limit: Option<usize>,
145
- properties: Arc<PlanProperties>,
146
- }
147
-
148
- impl<S> std::fmt::Debug for LixDirectoryHistoryScanExec<S> {
149
- fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
150
- f.debug_struct("LixDirectoryHistoryScanExec")
151
- .field("route", &self.route)
152
- .field("limit", &self.limit)
153
- .finish()
154
- }
155
- }
156
-
157
- impl<S> LixDirectoryHistoryScanExec<S> {
158
- fn new(
159
- commit_graph: Arc<Mutex<Box<dyn CommitGraphReader>>>,
160
- query_source: SqlHistoryQuerySource<S>,
161
- schema: SchemaRef,
162
- route: HistoryRoute,
163
- limit: Option<usize>,
164
- ) -> Self {
165
- let properties = PlanProperties::new(
166
- EquivalenceProperties::new(Arc::clone(&schema)),
167
- Partitioning::UnknownPartitioning(1),
168
- EmissionType::Incremental,
169
- Boundedness::Bounded,
170
- );
171
- Self {
172
- commit_graph,
173
- query_source,
174
- schema,
175
- route,
176
- limit,
177
- properties: Arc::new(properties),
178
- }
179
- }
180
- }
181
-
182
- impl<S> DisplayAs for LixDirectoryHistoryScanExec<S> {
183
- fn fmt_as(&self, t: DisplayFormatType, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
184
- match t {
185
- DisplayFormatType::Default | DisplayFormatType::Verbose => write!(
186
- f,
187
- "LixDirectoryHistoryScanExec(route={:?}, limit={:?})",
188
- self.route, self.limit
189
- ),
190
- DisplayFormatType::TreeRender => write!(f, "LixDirectoryHistoryScanExec"),
191
- }
192
- }
193
- }
194
-
195
- impl<S> ExecutionPlan for LixDirectoryHistoryScanExec<S>
196
- where
197
- S: StorageRead + Clone + Send + Sync + 'static,
198
- {
199
- fn name(&self) -> &str {
200
- "LixDirectoryHistoryScanExec"
201
- }
202
-
203
- fn as_any(&self) -> &dyn Any {
204
- self
205
- }
206
-
207
- fn properties(&self) -> &Arc<PlanProperties> {
208
- &self.properties
209
- }
210
-
211
- fn children(&self) -> Vec<&Arc<dyn ExecutionPlan>> {
212
- Vec::new()
213
- }
214
-
215
- fn with_new_children(
216
- self: Arc<Self>,
217
- children: Vec<Arc<dyn ExecutionPlan>>,
218
- ) -> Result<Arc<dyn ExecutionPlan>> {
219
- if !children.is_empty() {
220
- return Err(DataFusionError::Execution(
221
- "LixDirectoryHistoryScanExec does not accept children".to_string(),
222
- ));
223
- }
224
- Ok(self)
225
- }
226
-
227
- fn execute(
228
- &self,
229
- partition: usize,
230
- _context: Arc<TaskContext>,
231
- ) -> Result<SendableRecordBatchStream> {
232
- if partition != 0 {
233
- return Err(DataFusionError::Execution(format!(
234
- "LixDirectoryHistoryScanExec only exposes one partition, got {partition}"
235
- )));
236
- }
237
-
238
- let commit_graph = Arc::clone(&self.commit_graph);
239
- let query_source = self.query_source.clone();
240
- let schema = Arc::clone(&self.schema);
241
- let stream_schema = Arc::clone(&schema);
242
- let route = self.route.clone();
243
- let limit = self.limit;
244
- let fut = async move {
245
- let mut rows = load_directory_history_rows(commit_graph, query_source, &route)
246
- .await
247
- .map_err(lix_error_to_datafusion_error)?;
248
- if let Some(limit) = limit {
249
- rows.truncate(limit);
250
- }
251
- directory_history_record_batch(&stream_schema, &rows)
252
- .map_err(lix_error_to_datafusion_error)
253
- };
254
-
255
- Ok(Box::pin(RecordBatchStreamAdapter::new(
256
- schema,
257
- stream::once(fut),
258
- )))
259
- }
260
- }
261
-
262
- #[derive(Debug, Clone)]
263
- struct DirectoryHistoryRecord {
264
- id: String,
265
- parent_id: Option<String>,
266
- name: Option<String>,
267
- hidden: Option<bool>,
268
- entry: HistoryEntry,
269
- }
270
-
271
- #[derive(Debug, Clone)]
272
- struct DirectoryHistoryOutputRow {
273
- entity_pk: String,
274
- id: String,
275
- path: Option<String>,
276
- parent_id: Option<String>,
277
- name: Option<String>,
278
- hidden: Option<bool>,
279
- descriptor_change: MaterializedChange,
280
- event: DirectoryHistoryEvent,
281
- }
282
-
283
- #[derive(Debug, Clone)]
284
- struct DirectoryHistoryEvent {
285
- directory_id: String,
286
- start_commit_id: String,
287
- depth: u32,
288
- change: MaterializedChange,
289
- observed_commit_id: String,
290
- commit_created_at: String,
291
- }
292
-
293
- #[derive(Debug, Deserialize)]
294
- struct DirectoryDescriptorSnapshot {
295
- id: String,
296
- parent_id: Option<String>,
297
- name: String,
298
- hidden: Option<bool>,
299
- }
300
-
301
- async fn load_directory_history_rows<S>(
302
- commit_graph: Arc<Mutex<Box<dyn CommitGraphReader>>>,
303
- query_source: SqlHistoryQuerySource<S>,
304
- route: &HistoryRoute,
305
- ) -> Result<Vec<DirectoryHistoryOutputRow>, LixError>
306
- where
307
- S: StorageRead + Clone + Send + Sync + 'static,
308
- {
309
- let event_route = route.traversal_only();
310
- let event_entries = load_history_entries(
311
- HistoryViewDescriptor {
312
- view_name: "lix_directory_history",
313
- start_commit_column: HISTORY_COL_START_COMMIT_ID,
314
- },
315
- Arc::clone(&commit_graph),
316
- query_source.json_reader.clone(),
317
- &event_route,
318
- vec![DIRECTORY_DESCRIPTOR_SCHEMA_KEY.to_string()],
319
- )
320
- .await?;
321
- let context_route = route.starts_only();
322
- let context_entries = load_history_entries(
323
- HistoryViewDescriptor {
324
- view_name: "lix_directory_history",
325
- start_commit_column: HISTORY_COL_START_COMMIT_ID,
326
- },
327
- commit_graph,
328
- query_source.json_reader,
329
- &context_route,
330
- vec![DIRECTORY_DESCRIPTOR_SCHEMA_KEY.to_string()],
331
- )
332
- .await?;
333
- let event_descriptors = parse_directory_history_records(&event_entries)?;
334
- let descriptors = parse_directory_history_records(&context_entries)?;
335
- let mut output = Vec::new();
336
-
337
- for descriptor in &event_descriptors {
338
- let event = directory_history_event_from_entry(&descriptor.id, &descriptor.entry);
339
- let Some(visible_descriptor) = nearest_directory_descriptor(&descriptors, &event) else {
340
- continue;
341
- };
342
- let path = if visible_descriptor.name.is_some() {
343
- resolve_directory_history_path(
344
- &visible_descriptor.id,
345
- &event.start_commit_id,
346
- event.depth,
347
- &descriptors,
348
- &mut BTreeMap::new(),
349
- &mut BTreeSet::new(),
350
- )
351
- } else {
352
- None
353
- };
354
- let id = tombstone_identity_column_value(
355
- "id",
356
- &visible_descriptor.id,
357
- HistoryIdentityProjection::SingleColumn { column: "id" },
358
- )?
359
- .and_then(|value| value.as_str().map(ToOwned::to_owned))
360
- .unwrap_or_else(|| visible_descriptor.id.clone());
361
- output.push(DirectoryHistoryOutputRow {
362
- entity_pk: visible_descriptor.id.clone(),
363
- id,
364
- path,
365
- parent_id: visible_descriptor.parent_id.clone(),
366
- name: visible_descriptor.name.clone(),
367
- hidden: visible_descriptor.hidden,
368
- descriptor_change: visible_descriptor.entry.change.clone(),
369
- event,
370
- });
371
- }
372
- output.retain(|row| {
373
- let entity_pk = entity_pk_json_array(&row.entity_pk).ok();
374
- route.matches_surface_row(
375
- DIRECTORY_DESCRIPTOR_SCHEMA_KEY,
376
- entity_pk.as_deref().unwrap_or(&row.entity_pk),
377
- None,
378
- row.event.depth,
379
- )
380
- });
381
-
382
- output.sort_by(|left, right| {
383
- left.entity_pk
384
- .cmp(&right.entity_pk)
385
- .then(left.event.start_commit_id.cmp(&right.event.start_commit_id))
386
- .then(left.event.depth.cmp(&right.event.depth))
387
- .then(
388
- left.event
389
- .observed_commit_id
390
- .cmp(&right.event.observed_commit_id),
391
- )
392
- .then(left.event.change.id.cmp(&right.event.change.id))
393
- });
394
- Ok(output)
395
- }
396
-
397
- fn parse_directory_history_records(
398
- entries: &[HistoryEntry],
399
- ) -> Result<Vec<DirectoryHistoryRecord>, LixError> {
400
- entries
401
- .iter()
402
- .filter(|entry| entry.change.schema_key == DIRECTORY_DESCRIPTOR_SCHEMA_KEY)
403
- .map(|entry| {
404
- let Some(snapshot_content) = entry.change.snapshot_content.as_deref() else {
405
- return Ok(DirectoryHistoryRecord {
406
- id: entry.change.entity_pk.as_single_string_owned()?,
407
- parent_id: None,
408
- name: None,
409
- hidden: None,
410
- entry: entry.clone(),
411
- });
412
- };
413
- let snapshot: DirectoryDescriptorSnapshot = serde_json::from_str(snapshot_content)
414
- .map_err(|error| {
415
- LixError::new(
416
- "LIX_ERROR_UNKNOWN",
417
- format!("invalid lix_directory_descriptor history snapshot JSON: {error}"),
418
- )
419
- })?;
420
- Ok(DirectoryHistoryRecord {
421
- id: snapshot.id,
422
- parent_id: snapshot.parent_id,
423
- name: Some(snapshot.name),
424
- hidden: Some(snapshot.hidden.unwrap_or(false)),
425
- entry: entry.clone(),
426
- })
427
- })
428
- .collect()
429
- }
430
-
431
- fn directory_history_event_from_entry(
432
- directory_id: &str,
433
- entry: &HistoryEntry,
434
- ) -> DirectoryHistoryEvent {
435
- DirectoryHistoryEvent {
436
- directory_id: directory_id.to_string(),
437
- start_commit_id: entry.start_commit_id.clone(),
438
- depth: entry.depth,
439
- change: entry.change.clone(),
440
- observed_commit_id: entry.observed_commit_id.clone(),
441
- commit_created_at: entry.commit_created_at.clone(),
442
- }
443
- }
444
-
445
- fn nearest_directory_descriptor<'a>(
446
- descriptors: &'a [DirectoryHistoryRecord],
447
- event: &DirectoryHistoryEvent,
448
- ) -> Option<&'a DirectoryHistoryRecord> {
449
- descriptors
450
- .iter()
451
- .filter(|descriptor| {
452
- let exact_descriptor_event =
453
- history_descriptor_event_matches(&descriptor.entry, event.depth, &event.change.id);
454
- (exact_descriptor_event || descriptor.name.is_some())
455
- && descriptor.id == event.directory_id
456
- && descriptor.entry.start_commit_id == event.start_commit_id
457
- && descriptor.entry.depth >= event.depth
458
- })
459
- .min_by(|left, right| {
460
- left.entry
461
- .depth
462
- .cmp(&right.entry.depth)
463
- .then(left.entry.change.id.cmp(&right.entry.change.id))
464
- })
465
- }
466
-
467
- fn resolve_directory_history_path(
468
- directory_id: &str,
469
- start_commit_id: &str,
470
- target_depth: u32,
471
- directories: &[DirectoryHistoryRecord],
472
- cache: &mut BTreeMap<String, Option<String>>,
473
- visiting: &mut BTreeSet<String>,
474
- ) -> Option<String> {
475
- if let Some(path) = cache.get(directory_id) {
476
- return path.clone();
477
- }
478
- if !visiting.insert(directory_id.to_string()) {
479
- cache.insert(directory_id.to_string(), None);
480
- return None;
481
- }
482
- let directory = directories
483
- .iter()
484
- .filter(|directory| {
485
- directory.name.is_some()
486
- && directory.id == directory_id
487
- && directory.entry.start_commit_id == start_commit_id
488
- && directory.entry.depth >= target_depth
489
- })
490
- .min_by(|left, right| {
491
- left.entry
492
- .depth
493
- .cmp(&right.entry.depth)
494
- .then(left.entry.change.id.cmp(&right.entry.change.id))
495
- })?;
496
- let name = directory.name.as_ref()?;
497
- let path = match directory.parent_id.as_deref() {
498
- Some(parent_id) => {
499
- let parent_path = resolve_directory_history_path(
500
- parent_id,
501
- start_commit_id,
502
- target_depth,
503
- directories,
504
- cache,
505
- visiting,
506
- )?;
507
- format!("{parent_path}{name}/")
508
- }
509
- None => format!("/{name}/"),
510
- };
511
- visiting.remove(directory_id);
512
- cache.insert(directory_id.to_string(), Some(path.clone()));
513
- Some(path)
514
- }
515
-
516
- fn directory_history_record_batch(
517
- schema: &SchemaRef,
518
- rows: &[DirectoryHistoryOutputRow],
519
- ) -> Result<RecordBatch, LixError> {
520
- let columns = schema
521
- .fields()
522
- .iter()
523
- .map(|field| directory_history_column_array(field.name(), rows))
524
- .collect::<Result<Vec<_>, _>>()?;
525
- let options = RecordBatchOptions::new().with_row_count(Some(rows.len()));
526
- RecordBatch::try_new_with_options(Arc::clone(schema), columns, &options).map_err(|error| {
527
- LixError::new(
528
- "LIX_ERROR_UNKNOWN",
529
- format!("sql2 failed to build lix_directory_history record batch: {error}"),
530
- )
531
- })
532
- }
533
-
534
- fn directory_history_column_array(
535
- column_name: &str,
536
- rows: &[DirectoryHistoryOutputRow],
537
- ) -> Result<ArrayRef, LixError> {
538
- Ok(match column_name {
539
- "id" => string_array(rows.iter().map(|row| Some(row.id.as_str()))),
540
- "path" => string_array(rows.iter().map(|row| row.path.as_deref())),
541
- "parent_id" => string_array(rows.iter().map(|row| row.parent_id.as_deref())),
542
- "name" => string_array(rows.iter().map(|row| row.name.as_deref())),
543
- "hidden" => Arc::new(BooleanArray::from(
544
- rows.iter().map(|row| row.hidden).collect::<Vec<_>>(),
545
- )) as ArrayRef,
546
- HISTORY_COL_ENTITY_PK => Arc::new(StringArray::from(
547
- rows.iter()
548
- .map(|row| entity_pk_json_array(&row.entity_pk).map(Some))
549
- .collect::<std::result::Result<Vec<_>, _>>()?,
550
- )) as ArrayRef,
551
- HISTORY_COL_SCHEMA_KEY => {
552
- string_array(rows.iter().map(|_| Some(DIRECTORY_DESCRIPTOR_SCHEMA_KEY)))
553
- }
554
- HISTORY_COL_FILE_ID => string_array(rows.iter().map(|_| None)),
555
- HISTORY_COL_CHANGE_ID => {
556
- string_array(rows.iter().map(|row| Some(row.event.change.id.as_str())))
557
- }
558
- HISTORY_COL_SNAPSHOT_CONTENT => string_array(
559
- rows.iter()
560
- .map(|row| row.descriptor_change.snapshot_content.as_deref()),
561
- ),
562
- HISTORY_COL_METADATA => Arc::new(StringArray::from(
563
- rows.iter()
564
- .map(|row| {
565
- row.descriptor_change
566
- .metadata
567
- .as_ref()
568
- .map(serialize_row_metadata)
569
- })
570
- .collect::<Vec<_>>(),
571
- )),
572
- HISTORY_COL_OBSERVED_COMMIT_ID => string_array(
573
- rows.iter()
574
- .map(|row| Some(row.event.observed_commit_id.as_str())),
575
- ),
576
- HISTORY_COL_COMMIT_CREATED_AT => string_array(
577
- rows.iter()
578
- .map(|row| Some(row.event.commit_created_at.as_str())),
579
- ),
580
- HISTORY_COL_START_COMMIT_ID => string_array(
581
- rows.iter()
582
- .map(|row| Some(row.event.start_commit_id.as_str())),
583
- ),
584
- HISTORY_COL_DEPTH => Arc::new(Int64Array::from(
585
- rows.iter()
586
- .map(|row| i64::from(row.event.depth))
587
- .collect::<Vec<_>>(),
588
- )) as ArrayRef,
589
- other => {
590
- return Err(LixError::new(
591
- "LIX_ERROR_UNKNOWN",
592
- format!(
593
- "sql2 lix_directory_history provider does not support projected column '{other}'"
594
- ),
595
- ))
596
- }
597
- })
598
- }
599
-
600
- pub(super) fn lix_directory_history_schema() -> SchemaRef {
601
- Arc::new(Schema::new(vec![
602
- Field::new("id", DataType::Utf8, false),
603
- Field::new("path", DataType::Utf8, true),
604
- Field::new("parent_id", DataType::Utf8, true),
605
- Field::new("name", DataType::Utf8, true),
606
- Field::new("hidden", DataType::Boolean, true),
607
- json_field(HISTORY_COL_ENTITY_PK, false),
608
- Field::new(HISTORY_COL_SCHEMA_KEY, DataType::Utf8, false),
609
- Field::new(HISTORY_COL_FILE_ID, DataType::Utf8, true),
610
- json_field(HISTORY_COL_SNAPSHOT_CONTENT, true),
611
- Field::new(HISTORY_COL_CHANGE_ID, DataType::Utf8, false),
612
- json_field(HISTORY_COL_METADATA, true),
613
- Field::new(HISTORY_COL_OBSERVED_COMMIT_ID, DataType::Utf8, false),
614
- Field::new(HISTORY_COL_COMMIT_CREATED_AT, DataType::Utf8, false),
615
- Field::new(HISTORY_COL_START_COMMIT_ID, DataType::Utf8, false),
616
- Field::new(HISTORY_COL_DEPTH, DataType::Int64, false),
617
- ]))
618
- }
619
-
620
- fn projected_schema(base_schema: &SchemaRef, projection: Option<&Vec<usize>>) -> Result<SchemaRef> {
621
- let Some(projection) = projection else {
622
- return Ok(Arc::clone(base_schema));
623
- };
624
- Ok(Arc::new(base_schema.project(projection)?))
625
- }
626
-
627
- fn string_array<'a>(values: impl Iterator<Item = Option<&'a str>>) -> ArrayRef {
628
- Arc::new(StringArray::from(values.collect::<Vec<_>>())) as ArrayRef
629
- }
630
-
631
- fn datafusion_error_to_lix_error(error: DataFusionError) -> LixError {
632
- crate::sql2::error::datafusion_error_to_lix_error(error)
633
- }
634
-
635
- fn entity_pk_json_array(entity_pk: &str) -> Result<String, LixError> {
636
- serde_json::to_string(&[entity_pk]).map_err(|error| {
637
- LixError::unknown(format!(
638
- "failed to encode history entity pk as JSON: {error}"
639
- ))
640
- })
641
- }
642
-
643
- fn lix_error_to_datafusion_error(error: LixError) -> DataFusionError {
644
- crate::sql2::error::lix_error_to_datafusion_error(error)
645
- }