@lix-js/sdk 0.6.0-preview.1 → 0.6.0-preview.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (205):
  1. package/SKILL.md +304 -320
  2. package/dist/engine-wasm/wasm/lix_engine.d.ts +5 -0
  3. package/dist/engine-wasm/wasm/lix_engine.js +9 -13
  4. package/dist/engine-wasm/wasm/lix_engine.wasm +0 -0
  5. package/dist/engine-wasm/wasm/lix_engine.wasm.d.ts +1 -0
  6. package/dist/generated/builtin-schemas.d.ts +87 -162
  7. package/dist/generated/builtin-schemas.js +139 -236
  8. package/dist/open-lix.d.ts +103 -14
  9. package/dist/open-lix.js +3 -0
  10. package/dist/sqlite/index.js +99 -22
  11. package/dist-engine-src/README.md +18 -0
  12. package/dist-engine-src/src/backend/kv.rs +358 -0
  13. package/dist-engine-src/src/backend/mod.rs +12 -0
  14. package/dist-engine-src/src/backend/testing.rs +658 -0
  15. package/dist-engine-src/src/backend/types.rs +96 -0
  16. package/dist-engine-src/src/binary_cas/chunking.rs +31 -0
  17. package/dist-engine-src/src/binary_cas/codec.rs +346 -0
  18. package/dist-engine-src/src/binary_cas/context.rs +139 -0
  19. package/dist-engine-src/src/binary_cas/kv.rs +1063 -0
  20. package/dist-engine-src/src/binary_cas/mod.rs +11 -0
  21. package/dist-engine-src/src/binary_cas/types.rs +121 -0
  22. package/dist-engine-src/src/catalog/context.rs +412 -0
  23. package/dist-engine-src/src/catalog/mod.rs +10 -0
  24. package/dist-engine-src/src/catalog/schema.rs +4 -0
  25. package/dist-engine-src/src/catalog/snapshot.rs +1114 -0
  26. package/dist-engine-src/src/cel/context.rs +86 -0
  27. package/dist-engine-src/src/cel/error.rs +19 -0
  28. package/dist-engine-src/src/cel/mod.rs +8 -0
  29. package/dist-engine-src/src/cel/provider.rs +9 -0
  30. package/dist-engine-src/src/cel/runtime.rs +167 -0
  31. package/dist-engine-src/src/cel/value.rs +50 -0
  32. package/dist-engine-src/src/commit_graph/context.rs +901 -0
  33. package/dist-engine-src/src/commit_graph/mod.rs +11 -0
  34. package/dist-engine-src/src/commit_graph/types.rs +109 -0
  35. package/dist-engine-src/src/commit_graph/walker.rs +756 -0
  36. package/dist-engine-src/src/commit_store/codec.rs +887 -0
  37. package/dist-engine-src/src/commit_store/context.rs +944 -0
  38. package/dist-engine-src/src/commit_store/materialization.rs +84 -0
  39. package/dist-engine-src/src/commit_store/mod.rs +16 -0
  40. package/dist-engine-src/src/commit_store/storage.rs +600 -0
  41. package/dist-engine-src/src/commit_store/types.rs +215 -0
  42. package/dist-engine-src/src/common/error.rs +313 -0
  43. package/dist-engine-src/src/common/fingerprint.rs +3 -0
  44. package/dist-engine-src/src/common/fs_path.rs +1336 -0
  45. package/dist-engine-src/src/common/identity.rs +145 -0
  46. package/dist-engine-src/src/common/json_pointer.rs +67 -0
  47. package/dist-engine-src/src/common/metadata.rs +40 -0
  48. package/dist-engine-src/src/common/mod.rs +23 -0
  49. package/dist-engine-src/src/common/types.rs +105 -0
  50. package/dist-engine-src/src/common/wire.rs +222 -0
  51. package/dist-engine-src/src/domain.rs +324 -0
  52. package/dist-engine-src/src/engine.rs +225 -0
  53. package/dist-engine-src/src/entity_identity.rs +405 -0
  54. package/dist-engine-src/src/functions/context.rs +292 -0
  55. package/dist-engine-src/src/functions/deterministic.rs +113 -0
  56. package/dist-engine-src/src/functions/mod.rs +18 -0
  57. package/dist-engine-src/src/functions/provider.rs +130 -0
  58. package/dist-engine-src/src/functions/state.rs +336 -0
  59. package/dist-engine-src/src/functions/types.rs +37 -0
  60. package/dist-engine-src/src/init.rs +558 -0
  61. package/dist-engine-src/src/json_store/compression.rs +77 -0
  62. package/dist-engine-src/src/json_store/context.rs +423 -0
  63. package/dist-engine-src/src/json_store/encoded.rs +15 -0
  64. package/dist-engine-src/src/json_store/mod.rs +12 -0
  65. package/dist-engine-src/src/json_store/store.rs +1109 -0
  66. package/dist-engine-src/src/json_store/types.rs +217 -0
  67. package/dist-engine-src/src/lib.rs +62 -0
  68. package/dist-engine-src/src/live_state/context.rs +2019 -0
  69. package/dist-engine-src/src/live_state/mod.rs +15 -0
  70. package/dist-engine-src/src/live_state/overlay.rs +75 -0
  71. package/dist-engine-src/src/live_state/reader.rs +23 -0
  72. package/dist-engine-src/src/live_state/types.rs +222 -0
  73. package/dist-engine-src/src/live_state/visibility.rs +223 -0
  74. package/dist-engine-src/src/plugin/archive.rs +438 -0
  75. package/dist-engine-src/src/plugin/component.rs +183 -0
  76. package/dist-engine-src/src/plugin/install.rs +619 -0
  77. package/dist-engine-src/src/plugin/manifest.rs +516 -0
  78. package/dist-engine-src/src/plugin/materializer.rs +477 -0
  79. package/dist-engine-src/src/plugin/mod.rs +33 -0
  80. package/dist-engine-src/src/plugin/plugin_manifest.json +118 -0
  81. package/dist-engine-src/src/plugin/storage.rs +74 -0
  82. package/dist-engine-src/src/schema/annotations/defaults.rs +275 -0
  83. package/dist-engine-src/src/schema/annotations/mod.rs +1 -0
  84. package/dist-engine-src/src/schema/builtin/lix_account.json +21 -0
  85. package/dist-engine-src/src/schema/builtin/lix_active_account.json +29 -0
  86. package/dist-engine-src/src/schema/builtin/lix_binary_blob_ref.json +29 -0
  87. package/dist-engine-src/src/schema/builtin/lix_change.json +63 -0
  88. package/dist-engine-src/src/schema/builtin/lix_change_author.json +45 -0
  89. package/dist-engine-src/src/schema/builtin/lix_commit.json +24 -0
  90. package/dist-engine-src/src/schema/builtin/lix_commit_edge.json +53 -0
  91. package/dist-engine-src/src/schema/builtin/lix_directory_descriptor.json +52 -0
  92. package/dist-engine-src/src/schema/builtin/lix_file_descriptor.json +52 -0
  93. package/dist-engine-src/src/schema/builtin/lix_key_value.json +40 -0
  94. package/dist-engine-src/src/schema/builtin/lix_label.json +29 -0
  95. package/dist-engine-src/src/schema/builtin/lix_label_assignment.json +74 -0
  96. package/dist-engine-src/src/schema/builtin/lix_registered_schema.json +25 -0
  97. package/dist-engine-src/src/schema/builtin/lix_version_descriptor.json +34 -0
  98. package/dist-engine-src/src/schema/builtin/lix_version_ref.json +48 -0
  99. package/dist-engine-src/src/schema/builtin/mod.rs +222 -0
  100. package/dist-engine-src/src/schema/compatibility.rs +787 -0
  101. package/dist-engine-src/src/schema/definition.json +187 -0
  102. package/dist-engine-src/src/schema/definition.rs +742 -0
  103. package/dist-engine-src/src/schema/key.rs +138 -0
  104. package/dist-engine-src/src/schema/mod.rs +20 -0
  105. package/dist-engine-src/src/schema/seed.rs +14 -0
  106. package/dist-engine-src/src/schema/tests.rs +780 -0
  107. package/dist-engine-src/src/session/context.rs +364 -0
  108. package/dist-engine-src/src/session/create_version.rs +88 -0
  109. package/dist-engine-src/src/session/execute.rs +478 -0
  110. package/dist-engine-src/src/session/merge/analysis.rs +102 -0
  111. package/dist-engine-src/src/session/merge/apply.rs +23 -0
  112. package/dist-engine-src/src/session/merge/conflicts.rs +63 -0
  113. package/dist-engine-src/src/session/merge/mod.rs +11 -0
  114. package/dist-engine-src/src/session/merge/stats.rs +65 -0
  115. package/dist-engine-src/src/session/merge/version.rs +427 -0
  116. package/dist-engine-src/src/session/mod.rs +27 -0
  117. package/dist-engine-src/src/session/optimization9_sql2_bench.rs +100 -0
  118. package/dist-engine-src/src/session/switch_version.rs +109 -0
  119. package/dist-engine-src/src/sql2/change_provider.rs +331 -0
  120. package/dist-engine-src/src/sql2/classify.rs +182 -0
  121. package/dist-engine-src/src/sql2/context.rs +311 -0
  122. package/dist-engine-src/src/sql2/directory_history_provider.rs +631 -0
  123. package/dist-engine-src/src/sql2/directory_provider.rs +2453 -0
  124. package/dist-engine-src/src/sql2/dml.rs +148 -0
  125. package/dist-engine-src/src/sql2/entity_history_provider.rs +440 -0
  126. package/dist-engine-src/src/sql2/entity_provider.rs +3211 -0
  127. package/dist-engine-src/src/sql2/error.rs +216 -0
  128. package/dist-engine-src/src/sql2/execute.rs +3440 -0
  129. package/dist-engine-src/src/sql2/file_history_provider.rs +910 -0
  130. package/dist-engine-src/src/sql2/file_provider.rs +3679 -0
  131. package/dist-engine-src/src/sql2/filesystem_planner.rs +1490 -0
  132. package/dist-engine-src/src/sql2/filesystem_predicates.rs +159 -0
  133. package/dist-engine-src/src/sql2/filesystem_visibility.rs +383 -0
  134. package/dist-engine-src/src/sql2/history_projection.rs +56 -0
  135. package/dist-engine-src/src/sql2/history_provider.rs +412 -0
  136. package/dist-engine-src/src/sql2/history_route.rs +657 -0
  137. package/dist-engine-src/src/sql2/lix_state_provider.rs +2512 -0
  138. package/dist-engine-src/src/sql2/mod.rs +46 -0
  139. package/dist-engine-src/src/sql2/predicate_typecheck.rs +246 -0
  140. package/dist-engine-src/src/sql2/public_bind/assignment.rs +46 -0
  141. package/dist-engine-src/src/sql2/public_bind/capability.rs +41 -0
  142. package/dist-engine-src/src/sql2/public_bind/dml.rs +166 -0
  143. package/dist-engine-src/src/sql2/public_bind/mod.rs +25 -0
  144. package/dist-engine-src/src/sql2/public_bind/table.rs +168 -0
  145. package/dist-engine-src/src/sql2/read_only.rs +63 -0
  146. package/dist-engine-src/src/sql2/record_batch.rs +17 -0
  147. package/dist-engine-src/src/sql2/result_metadata.rs +29 -0
  148. package/dist-engine-src/src/sql2/runtime.rs +60 -0
  149. package/dist-engine-src/src/sql2/session.rs +132 -0
  150. package/dist-engine-src/src/sql2/udfs/common.rs +295 -0
  151. package/dist-engine-src/src/sql2/udfs/lix_active_version_commit_id.rs +53 -0
  152. package/dist-engine-src/src/sql2/udfs/lix_empty_blob.rs +47 -0
  153. package/dist-engine-src/src/sql2/udfs/lix_json.rs +100 -0
  154. package/dist-engine-src/src/sql2/udfs/lix_json_get.rs +99 -0
  155. package/dist-engine-src/src/sql2/udfs/lix_json_get_text.rs +99 -0
  156. package/dist-engine-src/src/sql2/udfs/lix_text_decode.rs +82 -0
  157. package/dist-engine-src/src/sql2/udfs/lix_text_encode.rs +85 -0
  158. package/dist-engine-src/src/sql2/udfs/lix_timestamp.rs +76 -0
  159. package/dist-engine-src/src/sql2/udfs/lix_uuid_v7.rs +76 -0
  160. package/dist-engine-src/src/sql2/udfs/mod.rs +89 -0
  161. package/dist-engine-src/src/sql2/udfs/public_call.rs +211 -0
  162. package/dist-engine-src/src/sql2/version_provider.rs +1202 -0
  163. package/dist-engine-src/src/sql2/version_scope.rs +394 -0
  164. package/dist-engine-src/src/sql2/write_normalization.rs +345 -0
  165. package/dist-engine-src/src/storage/context.rs +356 -0
  166. package/dist-engine-src/src/storage/mod.rs +14 -0
  167. package/dist-engine-src/src/storage/read_scope.rs +88 -0
  168. package/dist-engine-src/src/storage/types.rs +501 -0
  169. package/dist-engine-src/src/storage_bench.rs +4863 -0
  170. package/dist-engine-src/src/test_support.rs +228 -0
  171. package/dist-engine-src/src/tracked_state/by_file_index.rs +98 -0
  172. package/dist-engine-src/src/tracked_state/codec.rs +2085 -0
  173. package/dist-engine-src/src/tracked_state/context.rs +1867 -0
  174. package/dist-engine-src/src/tracked_state/diff.rs +686 -0
  175. package/dist-engine-src/src/tracked_state/materialization.rs +403 -0
  176. package/dist-engine-src/src/tracked_state/materializer.rs +488 -0
  177. package/dist-engine-src/src/tracked_state/merge.rs +492 -0
  178. package/dist-engine-src/src/tracked_state/mod.rs +32 -0
  179. package/dist-engine-src/src/tracked_state/storage.rs +375 -0
  180. package/dist-engine-src/src/tracked_state/tree.rs +3187 -0
  181. package/dist-engine-src/src/tracked_state/types.rs +231 -0
  182. package/dist-engine-src/src/transaction/commit.rs +1484 -0
  183. package/dist-engine-src/src/transaction/context.rs +1548 -0
  184. package/dist-engine-src/src/transaction/live_state_overlay.rs +35 -0
  185. package/dist-engine-src/src/transaction/mod.rs +13 -0
  186. package/dist-engine-src/src/transaction/normalization.rs +890 -0
  187. package/dist-engine-src/src/transaction/prep.rs +37 -0
  188. package/dist-engine-src/src/transaction/schema_resolver.rs +149 -0
  189. package/dist-engine-src/src/transaction/staging.rs +1731 -0
  190. package/dist-engine-src/src/transaction/types.rs +460 -0
  191. package/dist-engine-src/src/transaction/validation.rs +5830 -0
  192. package/dist-engine-src/src/untracked_state/codec.rs +307 -0
  193. package/dist-engine-src/src/untracked_state/context.rs +98 -0
  194. package/dist-engine-src/src/untracked_state/materialization.rs +63 -0
  195. package/dist-engine-src/src/untracked_state/mod.rs +15 -0
  196. package/dist-engine-src/src/untracked_state/storage.rs +396 -0
  197. package/dist-engine-src/src/untracked_state/types.rs +146 -0
  198. package/dist-engine-src/src/version/context.rs +40 -0
  199. package/dist-engine-src/src/version/lifecycle.rs +221 -0
  200. package/dist-engine-src/src/version/mod.rs +13 -0
  201. package/dist-engine-src/src/version/refs.rs +330 -0
  202. package/dist-engine-src/src/version/stage_rows.rs +67 -0
  203. package/dist-engine-src/src/version/types.rs +21 -0
  204. package/dist-engine-src/src/wasm/mod.rs +60 -0
  205. package/package.json +68 -64
@@ -0,0 +1,159 @@
1
+ use datafusion::common::tree_node::{Transformed, TreeNode};
2
+ use datafusion::common::{DataFusionError, Result, ScalarValue};
3
+ use datafusion::logical_expr::expr::{Between, InList};
4
+ use datafusion::logical_expr::{BinaryExpr, Expr, Operator};
5
+
6
+ use crate::common::{normalize_directory_path, ParsedFilePath};
7
+ use crate::LixError;
8
+
9
+ use super::error::lix_error_to_datafusion_error;
10
+
11
/// Selects which canonicalization routine is applied to `path` literals.
#[derive(Debug, Clone, Copy)]
pub(crate) enum FilesystemPathKind {
    /// Literals are canonicalized through `ParsedFilePath::try_from_path`.
    File,
    /// Literals are canonicalized through `normalize_directory_path`.
    Directory,
}
16
+
17
+ pub(crate) fn canonicalize_filesystem_path_filters(
18
+ filters: &[Expr],
19
+ kind: FilesystemPathKind,
20
+ ) -> Result<Vec<Expr>> {
21
+ filters
22
+ .iter()
23
+ .cloned()
24
+ .map(|filter| canonicalize_filesystem_path_filter(filter, kind))
25
+ .collect()
26
+ }
27
+
28
+ fn canonicalize_filesystem_path_filter(expr: Expr, kind: FilesystemPathKind) -> Result<Expr> {
29
+ expr.transform(|expr| canonicalize_filesystem_path_expr(expr, kind))
30
+ .map(|transformed| transformed.data)
31
+ }
32
+
33
+ fn canonicalize_filesystem_path_expr(
34
+ expr: Expr,
35
+ kind: FilesystemPathKind,
36
+ ) -> Result<Transformed<Expr>> {
37
+ match expr {
38
+ Expr::BinaryExpr(binary_expr) if is_path_comparison_operator(binary_expr.op) => {
39
+ canonicalize_path_binary_expr(binary_expr, kind)
40
+ }
41
+ Expr::InList(in_list) if is_path_column(&in_list.expr) => {
42
+ canonicalize_path_in_list(in_list, kind)
43
+ }
44
+ Expr::Between(between) if is_path_column(&between.expr) => {
45
+ canonicalize_path_between(between, kind)
46
+ }
47
+ _ => Ok(Transformed::no(expr)),
48
+ }
49
+ }
50
+
51
+ fn canonicalize_path_binary_expr(
52
+ binary_expr: BinaryExpr,
53
+ kind: FilesystemPathKind,
54
+ ) -> Result<Transformed<Expr>> {
55
+ let BinaryExpr { left, op, right } = binary_expr;
56
+ let left_is_path = is_path_column(&left);
57
+ let right_is_path = is_path_column(&right);
58
+
59
+ let left = if right_is_path {
60
+ Box::new(canonicalize_path_literal_expr(*left, kind)?)
61
+ } else {
62
+ left
63
+ };
64
+ let right = if left_is_path {
65
+ Box::new(canonicalize_path_literal_expr(*right, kind)?)
66
+ } else {
67
+ right
68
+ };
69
+
70
+ Ok(Transformed::yes(Expr::BinaryExpr(BinaryExpr::new(
71
+ left, op, right,
72
+ ))))
73
+ }
74
+
75
+ fn canonicalize_path_in_list(
76
+ in_list: InList,
77
+ kind: FilesystemPathKind,
78
+ ) -> Result<Transformed<Expr>> {
79
+ let list = in_list
80
+ .list
81
+ .into_iter()
82
+ .map(|expr| canonicalize_path_literal_expr(expr, kind))
83
+ .collect::<Result<Vec<_>>>()?;
84
+ Ok(Transformed::yes(Expr::InList(InList::new(
85
+ in_list.expr,
86
+ list,
87
+ in_list.negated,
88
+ ))))
89
+ }
90
+
91
+ fn canonicalize_path_between(
92
+ between: Between,
93
+ kind: FilesystemPathKind,
94
+ ) -> Result<Transformed<Expr>> {
95
+ Ok(Transformed::yes(Expr::Between(Between {
96
+ expr: between.expr,
97
+ negated: between.negated,
98
+ low: Box::new(canonicalize_path_literal_expr(*between.low, kind)?),
99
+ high: Box::new(canonicalize_path_literal_expr(*between.high, kind)?),
100
+ })))
101
+ }
102
+
103
+ fn canonicalize_path_literal_expr(expr: Expr, kind: FilesystemPathKind) -> Result<Expr> {
104
+ let Expr::Literal(literal, metadata) = expr else {
105
+ return Err(unsupported_dynamic_path_predicate_error(expr));
106
+ };
107
+
108
+ match literal {
109
+ ScalarValue::Utf8(Some(value))
110
+ | ScalarValue::Utf8View(Some(value))
111
+ | ScalarValue::LargeUtf8(Some(value)) => {
112
+ let normalized = canonicalize_path_value(&value, kind)?;
113
+ Ok(Expr::Literal(ScalarValue::Utf8(Some(normalized)), metadata))
114
+ }
115
+ _ => Ok(Expr::Literal(literal, metadata)),
116
+ }
117
+ }
118
+
119
+ fn canonicalize_path_value(value: &str, kind: FilesystemPathKind) -> Result<String> {
120
+ match kind {
121
+ FilesystemPathKind::File => ParsedFilePath::try_from_path(value)
122
+ .map(|parsed| parsed.normalized_path.to_string())
123
+ .map_err(lix_error_to_datafusion_error),
124
+ FilesystemPathKind::Directory => {
125
+ normalize_directory_path(value).map_err(lix_error_to_datafusion_error)
126
+ }
127
+ }
128
+ }
129
+
130
+ fn is_path_column(expr: &Expr) -> bool {
131
+ matches!(expr, Expr::Column(column) if column.name == "path")
132
+ }
133
+
134
+ fn is_path_comparison_operator(op: Operator) -> bool {
135
+ matches!(
136
+ op,
137
+ Operator::Eq
138
+ | Operator::NotEq
139
+ | Operator::Lt
140
+ | Operator::LtEq
141
+ | Operator::Gt
142
+ | Operator::GtEq
143
+ )
144
+ }
145
+
146
+ fn unsupported_dynamic_path_predicate_error(expr: Expr) -> DataFusionError {
147
+ lix_error_to_datafusion_error(
148
+ LixError::new(
149
+ LixError::CODE_UNSUPPORTED_SQL,
150
+ format!(
151
+ "filesystem path predicates only support literal path values; found expression {expr:?}"
152
+ ),
153
+ )
154
+ .with_hint(
155
+ "Compare lix_file.path or lix_directory.path to a string literal or bound parameter. \
156
+ Computed path expressions are not supported until path canonicalization can run at evaluation time.",
157
+ ),
158
+ )
159
+ }
@@ -0,0 +1,383 @@
1
+ #![allow(dead_code)]
2
+
3
+ use std::collections::{BTreeMap, BTreeSet};
4
+ use std::sync::Arc;
5
+
6
+ use serde::Deserialize;
7
+
8
+ use crate::live_state::MaterializedLiveStateRow;
9
+ use crate::live_state::{LiveStateFilter, LiveStateReader, LiveStateScanRequest};
10
+ use crate::LixError;
11
+
12
+ use super::filesystem_planner::{
13
+ FilesystemRowContext, BLOB_REF_SCHEMA_KEY, DIRECTORY_DESCRIPTOR_SCHEMA_KEY,
14
+ FILE_DESCRIPTOR_SCHEMA_KEY,
15
+ };
16
+
17
+ /// Execution-visible filesystem metadata decoded from live-state rows.
18
+ ///
19
+ /// The helper intentionally depends only on `LiveStateReader`. In engine
20
+ /// write execution that context may include staged rows, so filesystem planning
21
+ /// sees pending writes without reaching into write-execution internals.
22
+ #[derive(Debug, Clone, PartialEq, Eq, Default)]
23
+ pub(crate) struct VisibleFilesystem {
24
+ pub(crate) directories_by_id: BTreeMap<String, VisibleDirectory>,
25
+ pub(crate) directory_children_by_parent_id: BTreeMap<Option<String>, BTreeSet<String>>,
26
+ pub(crate) files_by_directory_id: BTreeMap<Option<String>, BTreeMap<String, VisibleFile>>,
27
+ pub(crate) blob_refs_by_file_id: BTreeMap<String, VisibleBlobRef>,
28
+ }
29
+
30
+ impl VisibleFilesystem {
31
+ /// Loads filesystem rows for a single version from execution-visible live
32
+ /// state and builds lookup indexes used by filesystem write planning.
33
+ pub(crate) async fn load(
34
+ live_state: Arc<dyn LiveStateReader>,
35
+ version_id: &str,
36
+ ) -> Result<Self, LixError> {
37
+ let rows = live_state
38
+ .scan_rows(&LiveStateScanRequest {
39
+ filter: LiveStateFilter {
40
+ schema_keys: vec![
41
+ DIRECTORY_DESCRIPTOR_SCHEMA_KEY.to_string(),
42
+ FILE_DESCRIPTOR_SCHEMA_KEY.to_string(),
43
+ BLOB_REF_SCHEMA_KEY.to_string(),
44
+ ],
45
+ version_ids: vec![version_id.to_string()],
46
+ ..LiveStateFilter::default()
47
+ },
48
+ ..LiveStateScanRequest::default()
49
+ })
50
+ .await?;
51
+ Self::from_live_rows(rows)
52
+ }
53
+
54
+ /// Builds filesystem lookup indexes from rows that are already known to be
55
+ /// transaction-visible.
56
+ pub(crate) fn from_live_rows(rows: Vec<MaterializedLiveStateRow>) -> Result<Self, LixError> {
57
+ let mut visible = Self::default();
58
+
59
+ for row in rows {
60
+ let Some(snapshot_content) = row.snapshot_content.as_deref() else {
61
+ continue;
62
+ };
63
+ match row.schema_key.as_str() {
64
+ DIRECTORY_DESCRIPTOR_SCHEMA_KEY => {
65
+ let snapshot: DirectoryDescriptorSnapshot =
66
+ serde_json::from_str(snapshot_content).map_err(|error| {
67
+ LixError::new(
68
+ "LIX_ERROR_UNKNOWN",
69
+ format!("invalid lix_directory_descriptor snapshot JSON: {error}"),
70
+ )
71
+ })?;
72
+ let directory = VisibleDirectory {
73
+ id: snapshot.id,
74
+ parent_id: snapshot.parent_id,
75
+ name: snapshot.name,
76
+ hidden: snapshot.hidden.unwrap_or(false),
77
+ context: filesystem_row_context(&row)?,
78
+ };
79
+ visible
80
+ .directory_children_by_parent_id
81
+ .entry(directory.parent_id.clone())
82
+ .or_default()
83
+ .insert(directory.id.clone());
84
+ visible
85
+ .directories_by_id
86
+ .insert(directory.id.clone(), directory);
87
+ }
88
+ FILE_DESCRIPTOR_SCHEMA_KEY => {
89
+ let snapshot: FileDescriptorSnapshot = serde_json::from_str(snapshot_content)
90
+ .map_err(|error| {
91
+ LixError::new(
92
+ "LIX_ERROR_UNKNOWN",
93
+ format!("invalid lix_file_descriptor snapshot JSON: {error}"),
94
+ )
95
+ })?;
96
+ let file = VisibleFile {
97
+ id: snapshot.id,
98
+ directory_id: snapshot.directory_id,
99
+ name: snapshot.name,
100
+ hidden: snapshot.hidden,
101
+ context: filesystem_row_context(&row)?,
102
+ };
103
+ visible
104
+ .files_by_directory_id
105
+ .entry(file.directory_id.clone())
106
+ .or_default()
107
+ .insert(file.id.clone(), file);
108
+ }
109
+ BLOB_REF_SCHEMA_KEY => {
110
+ let snapshot: BlobRefSnapshot = serde_json::from_str(snapshot_content)
111
+ .map_err(|error| {
112
+ LixError::new(
113
+ "LIX_ERROR_UNKNOWN",
114
+ format!("invalid lix_binary_blob_ref snapshot JSON: {error}"),
115
+ )
116
+ })?;
117
+ visible.blob_refs_by_file_id.insert(
118
+ snapshot.id.clone(),
119
+ VisibleBlobRef {
120
+ file_id: snapshot.id,
121
+ blob_hash: snapshot.blob_hash,
122
+ size_bytes: snapshot.size_bytes,
123
+ context: filesystem_row_context(&row)?,
124
+ },
125
+ );
126
+ }
127
+ _ => {}
128
+ }
129
+ }
130
+
131
+ Ok(visible)
132
+ }
133
+ }
134
+
135
+ #[derive(Debug, Clone, PartialEq, Eq)]
136
+ pub(crate) struct VisibleDirectory {
137
+ pub(crate) id: String,
138
+ pub(crate) parent_id: Option<String>,
139
+ pub(crate) name: String,
140
+ pub(crate) hidden: bool,
141
+ pub(crate) context: FilesystemRowContext,
142
+ }
143
+
144
+ #[derive(Debug, Clone, PartialEq, Eq)]
145
+ pub(crate) struct VisibleFile {
146
+ pub(crate) id: String,
147
+ pub(crate) directory_id: Option<String>,
148
+ pub(crate) name: String,
149
+ pub(crate) hidden: bool,
150
+ pub(crate) context: FilesystemRowContext,
151
+ }
152
+
153
+ #[derive(Debug, Clone, PartialEq, Eq)]
154
+ pub(crate) struct VisibleBlobRef {
155
+ pub(crate) file_id: String,
156
+ pub(crate) blob_hash: String,
157
+ pub(crate) size_bytes: Option<u64>,
158
+ pub(crate) context: FilesystemRowContext,
159
+ }
160
+
161
+ #[derive(Debug, Deserialize)]
162
+ struct DirectoryDescriptorSnapshot {
163
+ id: String,
164
+ parent_id: Option<String>,
165
+ name: String,
166
+ hidden: Option<bool>,
167
+ }
168
+
169
+ #[derive(Debug, Deserialize)]
170
+ struct FileDescriptorSnapshot {
171
+ id: String,
172
+ directory_id: Option<String>,
173
+ name: String,
174
+ hidden: bool,
175
+ }
176
+
177
+ #[derive(Debug, Deserialize)]
178
+ struct BlobRefSnapshot {
179
+ id: String,
180
+ blob_hash: String,
181
+ size_bytes: Option<u64>,
182
+ }
183
+
184
+ fn filesystem_row_context(
185
+ row: &MaterializedLiveStateRow,
186
+ ) -> Result<FilesystemRowContext, LixError> {
187
+ Ok(FilesystemRowContext {
188
+ version_id: row.version_id.clone(),
189
+ global: row.global,
190
+ untracked: row.untracked,
191
+ file_id: row.file_id.clone(),
192
+ metadata: row
193
+ .metadata
194
+ .as_deref()
195
+ .map(|metadata| {
196
+ crate::parse_row_metadata_value(metadata, "filesystem row metadata").and_then(
197
+ |metadata| {
198
+ crate::transaction::types::TransactionJson::from_value(
199
+ metadata,
200
+ "filesystem row metadata",
201
+ )
202
+ },
203
+ )
204
+ })
205
+ .transpose()?,
206
+ })
207
+ }
208
+
209
#[cfg(test)]
mod tests {
    use async_trait::async_trait;

    use crate::live_state::MaterializedLiveStateRow;
    use crate::live_state::{LiveStateReader, LiveStateRowRequest, LiveStateScanRequest};
    use crate::LixError;

    use super::{
        VisibleFilesystem, BLOB_REF_SCHEMA_KEY, DIRECTORY_DESCRIPTOR_SCHEMA_KEY,
        FILE_DESCRIPTOR_SCHEMA_KEY,
    };

    /// Directories are indexed by id and listed under their parent's id.
    #[tokio::test]
    async fn nested_directories_resolve_correctly() {
        let rows = vec![
            directory_row(
                "dir-docs",
                r#"{"id":"dir-docs","parent_id":null,"name":"docs","hidden":false}"#,
            ),
            directory_row(
                "dir-guides",
                r#"{"id":"dir-guides","parent_id":"dir-docs","name":"guides","hidden":false}"#,
            ),
        ];
        let filesystem = VisibleFilesystem::load(live_state(rows), "version-a")
            .await
            .expect("visible filesystem should load");

        let guides_parent = filesystem
            .directories_by_id
            .get("dir-guides")
            .and_then(|directory| directory.parent_id.as_deref());
        assert_eq!(guides_parent, Some("dir-docs"));

        let children_by_parent = &filesystem.directory_children_by_parent_id;
        assert!(children_by_parent
            .get(&None)
            .is_some_and(|children| children.contains("dir-docs")));
        assert!(children_by_parent
            .get(&Some("dir-docs".to_string()))
            .is_some_and(|children| children.contains("dir-guides")));
    }

    /// Files are grouped under the directory id recorded in their snapshot.
    #[tokio::test]
    async fn files_attach_to_directory_ids() {
        let rows = vec![file_row(
            "file-readme",
            r#"{"id":"file-readme","directory_id":"dir-guides","name":"readme.md","hidden":false}"#,
        )];
        let filesystem = VisibleFilesystem::load(live_state(rows), "version-a")
            .await
            .expect("visible filesystem should load");

        let directory_files = filesystem
            .files_by_directory_id
            .get(&Some("dir-guides".to_string()))
            .expect("directory should have attached files");
        let readme = directory_files
            .get("file-readme")
            .expect("file should be indexed by id inside directory");
        assert_eq!(readme.name, "readme.md");
    }

    /// Blob references are keyed by the file id recorded in their snapshot.
    #[tokio::test]
    async fn blob_refs_attach_to_file_ids() {
        let rows = vec![blob_ref_row(
            "file-readme",
            r#"{"id":"file-readme","blob_hash":"abc123","size_bytes":5}"#,
        )];
        let filesystem = VisibleFilesystem::load(live_state(rows), "version-a")
            .await
            .expect("visible filesystem should load");

        let blob_ref = filesystem
            .blob_refs_by_file_id
            .get("file-readme")
            .expect("blob ref should be indexed by file id");
        assert_eq!(blob_ref.blob_hash, "abc123");
        assert_eq!(blob_ref.size_bytes, Some(5));
    }

    /// Wraps fixed rows in an in-memory reader usable as `dyn LiveStateReader`.
    fn live_state(rows: Vec<MaterializedLiveStateRow>) -> std::sync::Arc<dyn LiveStateReader> {
        let reader = RowsLiveStateReader { rows };
        std::sync::Arc::new(reader)
    }

    /// In-memory reader that serves a fixed list of rows.
    struct RowsLiveStateReader {
        rows: Vec<MaterializedLiveStateRow>,
    }

    #[async_trait]
    impl LiveStateReader for RowsLiveStateReader {
        /// Returns the rows matching the request's schema-key and version-id
        /// filters; an empty filter list matches every row.
        async fn scan_rows(
            &self,
            request: &LiveStateScanRequest,
        ) -> Result<Vec<MaterializedLiveStateRow>, LixError> {
            let filter = &request.filter;
            let mut matching = Vec::new();
            for row in &self.rows {
                let schema_matches = filter.schema_keys.is_empty()
                    || filter.schema_keys.contains(&row.schema_key);
                let version_matches = filter.version_ids.is_empty()
                    || filter.version_ids.contains(&row.version_id);
                if schema_matches && version_matches {
                    matching.push(row.clone());
                }
            }
            Ok(matching)
        }

        /// Point lookups are not needed by these tests; always reports no row.
        async fn load_row(
            &self,
            _request: &LiveStateRowRequest,
        ) -> Result<Option<MaterializedLiveStateRow>, LixError> {
            Ok(None)
        }
    }

    /// Builds a directory descriptor row with no file id.
    fn directory_row(entity_id: &str, snapshot_content: &str) -> MaterializedLiveStateRow {
        let schema_key = DIRECTORY_DESCRIPTOR_SCHEMA_KEY;
        live_row(entity_id, schema_key, None, snapshot_content)
    }

    /// Builds a file descriptor row with no file id.
    fn file_row(entity_id: &str, snapshot_content: &str) -> MaterializedLiveStateRow {
        let schema_key = FILE_DESCRIPTOR_SCHEMA_KEY;
        live_row(entity_id, schema_key, None, snapshot_content)
    }

    /// Builds a blob-ref row whose file id equals its entity id.
    fn blob_ref_row(entity_id: &str, snapshot_content: &str) -> MaterializedLiveStateRow {
        let file_id = Some(entity_id.to_string());
        live_row(entity_id, BLOB_REF_SCHEMA_KEY, file_id, snapshot_content)
    }

    /// Builds a tracked, non-global, non-deleted row in `version-a` with
    /// change and commit ids derived from `entity_id`.
    fn live_row(
        entity_id: &str,
        schema_key: &str,
        file_id: Option<String>,
        snapshot_content: &str,
    ) -> MaterializedLiveStateRow {
        let change_id = format!("change-{entity_id}");
        let commit_id = format!("commit-{entity_id}");
        MaterializedLiveStateRow {
            entity_id: crate::entity_identity::EntityIdentity::single(entity_id),
            schema_key: schema_key.to_string(),
            file_id,
            snapshot_content: Some(snapshot_content.to_string()),
            metadata: None,
            deleted: false,
            version_id: "version-a".to_string(),
            change_id: Some(change_id),
            commit_id: Some(commit_id),
            global: false,
            untracked: false,
            created_at: "2026-04-23T00:00:00Z".to_string(),
            updated_at: "2026-04-23T01:00:00Z".to_string(),
        }
    }
}
@@ -0,0 +1,56 @@
1
+ use serde_json::Value as JsonValue;
2
+
3
+ use crate::entity_identity::EntityIdentity;
4
+ use crate::LixError;
5
+
6
/// Projection contract shared by typed history views.
///
/// A tombstone row (`snapshot_content IS NULL`) has no snapshot to project
/// payload from, so its non-identity columns must stay NULL. Identity columns
/// still survive because they are projected from the canonical entity
/// identity.
pub(crate) enum HistoryIdentityProjection<'a> {
    /// Identity columns are derived from primary-key paths; the position of a
    /// matching path selects the corresponding entity identity part.
    PrimaryKeyPaths(&'a [Vec<String>]),
    /// A single named column carries the entity id verbatim.
    SingleColumn { column: &'a str },
}
15
+
16
+ pub(crate) fn tombstone_identity_column_value(
17
+ column_name: &str,
18
+ entity_id: &str,
19
+ projection: HistoryIdentityProjection<'_>,
20
+ ) -> Result<Option<JsonValue>, LixError> {
21
+ match projection {
22
+ HistoryIdentityProjection::SingleColumn { column } => {
23
+ if column_name == column {
24
+ Ok(Some(JsonValue::String(entity_id.to_string())))
25
+ } else {
26
+ Ok(None)
27
+ }
28
+ }
29
+ HistoryIdentityProjection::PrimaryKeyPaths(primary_key_paths) => {
30
+ primary_key_tombstone_value(column_name, entity_id, primary_key_paths)
31
+ }
32
+ }
33
+ }
34
+
35
+ fn primary_key_tombstone_value(
36
+ column_name: &str,
37
+ entity_id: &str,
38
+ primary_key_paths: &[Vec<String>],
39
+ ) -> Result<Option<JsonValue>, LixError> {
40
+ let Some(part_index) = primary_key_paths
41
+ .iter()
42
+ .position(|path| path.as_slice() == [column_name])
43
+ else {
44
+ return Ok(None);
45
+ };
46
+
47
+ let identity = EntityIdentity::from_json_array_text(entity_id).map_err(|error| {
48
+ LixError::unknown(format!(
49
+ "failed to decode history tombstone entity identity: {error}"
50
+ ))
51
+ })?;
52
+ Ok(identity
53
+ .parts
54
+ .get(part_index)
55
+ .map(|part| JsonValue::String(part.clone())))
56
+ }