@lix-js/sdk 0.6.0-preview.1 → 0.6.0-preview.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/SKILL.md +304 -320
- package/dist/engine-wasm/wasm/lix_engine.d.ts +5 -0
- package/dist/engine-wasm/wasm/lix_engine.js +9 -13
- package/dist/engine-wasm/wasm/lix_engine.wasm +0 -0
- package/dist/engine-wasm/wasm/lix_engine.wasm.d.ts +1 -0
- package/dist/generated/builtin-schemas.d.ts +87 -162
- package/dist/generated/builtin-schemas.js +139 -236
- package/dist/open-lix.d.ts +103 -14
- package/dist/open-lix.js +3 -0
- package/dist/sqlite/index.js +99 -22
- package/dist-engine-src/README.md +18 -0
- package/dist-engine-src/src/backend/kv.rs +358 -0
- package/dist-engine-src/src/backend/mod.rs +12 -0
- package/dist-engine-src/src/backend/testing.rs +658 -0
- package/dist-engine-src/src/backend/types.rs +96 -0
- package/dist-engine-src/src/binary_cas/chunking.rs +31 -0
- package/dist-engine-src/src/binary_cas/codec.rs +346 -0
- package/dist-engine-src/src/binary_cas/context.rs +139 -0
- package/dist-engine-src/src/binary_cas/kv.rs +1063 -0
- package/dist-engine-src/src/binary_cas/mod.rs +11 -0
- package/dist-engine-src/src/binary_cas/types.rs +121 -0
- package/dist-engine-src/src/catalog/context.rs +412 -0
- package/dist-engine-src/src/catalog/mod.rs +10 -0
- package/dist-engine-src/src/catalog/schema.rs +4 -0
- package/dist-engine-src/src/catalog/snapshot.rs +1114 -0
- package/dist-engine-src/src/cel/context.rs +86 -0
- package/dist-engine-src/src/cel/error.rs +19 -0
- package/dist-engine-src/src/cel/mod.rs +8 -0
- package/dist-engine-src/src/cel/provider.rs +9 -0
- package/dist-engine-src/src/cel/runtime.rs +167 -0
- package/dist-engine-src/src/cel/value.rs +50 -0
- package/dist-engine-src/src/commit_graph/context.rs +901 -0
- package/dist-engine-src/src/commit_graph/mod.rs +11 -0
- package/dist-engine-src/src/commit_graph/types.rs +109 -0
- package/dist-engine-src/src/commit_graph/walker.rs +756 -0
- package/dist-engine-src/src/commit_store/codec.rs +887 -0
- package/dist-engine-src/src/commit_store/context.rs +944 -0
- package/dist-engine-src/src/commit_store/materialization.rs +84 -0
- package/dist-engine-src/src/commit_store/mod.rs +16 -0
- package/dist-engine-src/src/commit_store/storage.rs +600 -0
- package/dist-engine-src/src/commit_store/types.rs +215 -0
- package/dist-engine-src/src/common/error.rs +313 -0
- package/dist-engine-src/src/common/fingerprint.rs +3 -0
- package/dist-engine-src/src/common/fs_path.rs +1336 -0
- package/dist-engine-src/src/common/identity.rs +145 -0
- package/dist-engine-src/src/common/json_pointer.rs +67 -0
- package/dist-engine-src/src/common/metadata.rs +40 -0
- package/dist-engine-src/src/common/mod.rs +23 -0
- package/dist-engine-src/src/common/types.rs +105 -0
- package/dist-engine-src/src/common/wire.rs +222 -0
- package/dist-engine-src/src/domain.rs +324 -0
- package/dist-engine-src/src/engine.rs +225 -0
- package/dist-engine-src/src/entity_identity.rs +405 -0
- package/dist-engine-src/src/functions/context.rs +292 -0
- package/dist-engine-src/src/functions/deterministic.rs +113 -0
- package/dist-engine-src/src/functions/mod.rs +18 -0
- package/dist-engine-src/src/functions/provider.rs +130 -0
- package/dist-engine-src/src/functions/state.rs +336 -0
- package/dist-engine-src/src/functions/types.rs +37 -0
- package/dist-engine-src/src/init.rs +558 -0
- package/dist-engine-src/src/json_store/compression.rs +77 -0
- package/dist-engine-src/src/json_store/context.rs +423 -0
- package/dist-engine-src/src/json_store/encoded.rs +15 -0
- package/dist-engine-src/src/json_store/mod.rs +12 -0
- package/dist-engine-src/src/json_store/store.rs +1109 -0
- package/dist-engine-src/src/json_store/types.rs +217 -0
- package/dist-engine-src/src/lib.rs +62 -0
- package/dist-engine-src/src/live_state/context.rs +2019 -0
- package/dist-engine-src/src/live_state/mod.rs +15 -0
- package/dist-engine-src/src/live_state/overlay.rs +75 -0
- package/dist-engine-src/src/live_state/reader.rs +23 -0
- package/dist-engine-src/src/live_state/types.rs +222 -0
- package/dist-engine-src/src/live_state/visibility.rs +223 -0
- package/dist-engine-src/src/plugin/archive.rs +438 -0
- package/dist-engine-src/src/plugin/component.rs +183 -0
- package/dist-engine-src/src/plugin/install.rs +619 -0
- package/dist-engine-src/src/plugin/manifest.rs +516 -0
- package/dist-engine-src/src/plugin/materializer.rs +477 -0
- package/dist-engine-src/src/plugin/mod.rs +33 -0
- package/dist-engine-src/src/plugin/plugin_manifest.json +118 -0
- package/dist-engine-src/src/plugin/storage.rs +74 -0
- package/dist-engine-src/src/schema/annotations/defaults.rs +275 -0
- package/dist-engine-src/src/schema/annotations/mod.rs +1 -0
- package/dist-engine-src/src/schema/builtin/lix_account.json +21 -0
- package/dist-engine-src/src/schema/builtin/lix_active_account.json +29 -0
- package/dist-engine-src/src/schema/builtin/lix_binary_blob_ref.json +29 -0
- package/dist-engine-src/src/schema/builtin/lix_change.json +63 -0
- package/dist-engine-src/src/schema/builtin/lix_change_author.json +45 -0
- package/dist-engine-src/src/schema/builtin/lix_commit.json +24 -0
- package/dist-engine-src/src/schema/builtin/lix_commit_edge.json +53 -0
- package/dist-engine-src/src/schema/builtin/lix_directory_descriptor.json +52 -0
- package/dist-engine-src/src/schema/builtin/lix_file_descriptor.json +52 -0
- package/dist-engine-src/src/schema/builtin/lix_key_value.json +40 -0
- package/dist-engine-src/src/schema/builtin/lix_label.json +29 -0
- package/dist-engine-src/src/schema/builtin/lix_label_assignment.json +74 -0
- package/dist-engine-src/src/schema/builtin/lix_registered_schema.json +25 -0
- package/dist-engine-src/src/schema/builtin/lix_version_descriptor.json +34 -0
- package/dist-engine-src/src/schema/builtin/lix_version_ref.json +48 -0
- package/dist-engine-src/src/schema/builtin/mod.rs +222 -0
- package/dist-engine-src/src/schema/compatibility.rs +787 -0
- package/dist-engine-src/src/schema/definition.json +187 -0
- package/dist-engine-src/src/schema/definition.rs +742 -0
- package/dist-engine-src/src/schema/key.rs +138 -0
- package/dist-engine-src/src/schema/mod.rs +20 -0
- package/dist-engine-src/src/schema/seed.rs +14 -0
- package/dist-engine-src/src/schema/tests.rs +780 -0
- package/dist-engine-src/src/session/context.rs +364 -0
- package/dist-engine-src/src/session/create_version.rs +88 -0
- package/dist-engine-src/src/session/execute.rs +478 -0
- package/dist-engine-src/src/session/merge/analysis.rs +102 -0
- package/dist-engine-src/src/session/merge/apply.rs +23 -0
- package/dist-engine-src/src/session/merge/conflicts.rs +63 -0
- package/dist-engine-src/src/session/merge/mod.rs +11 -0
- package/dist-engine-src/src/session/merge/stats.rs +65 -0
- package/dist-engine-src/src/session/merge/version.rs +427 -0
- package/dist-engine-src/src/session/mod.rs +27 -0
- package/dist-engine-src/src/session/optimization9_sql2_bench.rs +100 -0
- package/dist-engine-src/src/session/switch_version.rs +109 -0
- package/dist-engine-src/src/sql2/change_provider.rs +331 -0
- package/dist-engine-src/src/sql2/classify.rs +182 -0
- package/dist-engine-src/src/sql2/context.rs +311 -0
- package/dist-engine-src/src/sql2/directory_history_provider.rs +631 -0
- package/dist-engine-src/src/sql2/directory_provider.rs +2453 -0
- package/dist-engine-src/src/sql2/dml.rs +148 -0
- package/dist-engine-src/src/sql2/entity_history_provider.rs +440 -0
- package/dist-engine-src/src/sql2/entity_provider.rs +3211 -0
- package/dist-engine-src/src/sql2/error.rs +216 -0
- package/dist-engine-src/src/sql2/execute.rs +3440 -0
- package/dist-engine-src/src/sql2/file_history_provider.rs +910 -0
- package/dist-engine-src/src/sql2/file_provider.rs +3679 -0
- package/dist-engine-src/src/sql2/filesystem_planner.rs +1490 -0
- package/dist-engine-src/src/sql2/filesystem_predicates.rs +159 -0
- package/dist-engine-src/src/sql2/filesystem_visibility.rs +383 -0
- package/dist-engine-src/src/sql2/history_projection.rs +56 -0
- package/dist-engine-src/src/sql2/history_provider.rs +412 -0
- package/dist-engine-src/src/sql2/history_route.rs +657 -0
- package/dist-engine-src/src/sql2/lix_state_provider.rs +2512 -0
- package/dist-engine-src/src/sql2/mod.rs +46 -0
- package/dist-engine-src/src/sql2/predicate_typecheck.rs +246 -0
- package/dist-engine-src/src/sql2/public_bind/assignment.rs +46 -0
- package/dist-engine-src/src/sql2/public_bind/capability.rs +41 -0
- package/dist-engine-src/src/sql2/public_bind/dml.rs +166 -0
- package/dist-engine-src/src/sql2/public_bind/mod.rs +25 -0
- package/dist-engine-src/src/sql2/public_bind/table.rs +168 -0
- package/dist-engine-src/src/sql2/read_only.rs +63 -0
- package/dist-engine-src/src/sql2/record_batch.rs +17 -0
- package/dist-engine-src/src/sql2/result_metadata.rs +29 -0
- package/dist-engine-src/src/sql2/runtime.rs +60 -0
- package/dist-engine-src/src/sql2/session.rs +132 -0
- package/dist-engine-src/src/sql2/udfs/common.rs +295 -0
- package/dist-engine-src/src/sql2/udfs/lix_active_version_commit_id.rs +53 -0
- package/dist-engine-src/src/sql2/udfs/lix_empty_blob.rs +47 -0
- package/dist-engine-src/src/sql2/udfs/lix_json.rs +100 -0
- package/dist-engine-src/src/sql2/udfs/lix_json_get.rs +99 -0
- package/dist-engine-src/src/sql2/udfs/lix_json_get_text.rs +99 -0
- package/dist-engine-src/src/sql2/udfs/lix_text_decode.rs +82 -0
- package/dist-engine-src/src/sql2/udfs/lix_text_encode.rs +85 -0
- package/dist-engine-src/src/sql2/udfs/lix_timestamp.rs +76 -0
- package/dist-engine-src/src/sql2/udfs/lix_uuid_v7.rs +76 -0
- package/dist-engine-src/src/sql2/udfs/mod.rs +89 -0
- package/dist-engine-src/src/sql2/udfs/public_call.rs +211 -0
- package/dist-engine-src/src/sql2/version_provider.rs +1202 -0
- package/dist-engine-src/src/sql2/version_scope.rs +394 -0
- package/dist-engine-src/src/sql2/write_normalization.rs +345 -0
- package/dist-engine-src/src/storage/context.rs +356 -0
- package/dist-engine-src/src/storage/mod.rs +14 -0
- package/dist-engine-src/src/storage/read_scope.rs +88 -0
- package/dist-engine-src/src/storage/types.rs +501 -0
- package/dist-engine-src/src/storage_bench.rs +4863 -0
- package/dist-engine-src/src/test_support.rs +228 -0
- package/dist-engine-src/src/tracked_state/by_file_index.rs +98 -0
- package/dist-engine-src/src/tracked_state/codec.rs +2085 -0
- package/dist-engine-src/src/tracked_state/context.rs +1867 -0
- package/dist-engine-src/src/tracked_state/diff.rs +686 -0
- package/dist-engine-src/src/tracked_state/materialization.rs +403 -0
- package/dist-engine-src/src/tracked_state/materializer.rs +488 -0
- package/dist-engine-src/src/tracked_state/merge.rs +492 -0
- package/dist-engine-src/src/tracked_state/mod.rs +32 -0
- package/dist-engine-src/src/tracked_state/storage.rs +375 -0
- package/dist-engine-src/src/tracked_state/tree.rs +3187 -0
- package/dist-engine-src/src/tracked_state/types.rs +231 -0
- package/dist-engine-src/src/transaction/commit.rs +1484 -0
- package/dist-engine-src/src/transaction/context.rs +1548 -0
- package/dist-engine-src/src/transaction/live_state_overlay.rs +35 -0
- package/dist-engine-src/src/transaction/mod.rs +13 -0
- package/dist-engine-src/src/transaction/normalization.rs +890 -0
- package/dist-engine-src/src/transaction/prep.rs +37 -0
- package/dist-engine-src/src/transaction/schema_resolver.rs +149 -0
- package/dist-engine-src/src/transaction/staging.rs +1731 -0
- package/dist-engine-src/src/transaction/types.rs +460 -0
- package/dist-engine-src/src/transaction/validation.rs +5830 -0
- package/dist-engine-src/src/untracked_state/codec.rs +307 -0
- package/dist-engine-src/src/untracked_state/context.rs +98 -0
- package/dist-engine-src/src/untracked_state/materialization.rs +63 -0
- package/dist-engine-src/src/untracked_state/mod.rs +15 -0
- package/dist-engine-src/src/untracked_state/storage.rs +396 -0
- package/dist-engine-src/src/untracked_state/types.rs +146 -0
- package/dist-engine-src/src/version/context.rs +40 -0
- package/dist-engine-src/src/version/lifecycle.rs +221 -0
- package/dist-engine-src/src/version/mod.rs +13 -0
- package/dist-engine-src/src/version/refs.rs +330 -0
- package/dist-engine-src/src/version/stage_rows.rs +67 -0
- package/dist-engine-src/src/version/types.rs +21 -0
- package/dist-engine-src/src/wasm/mod.rs +60 -0
- package/package.json +68 -64
|
@@ -0,0 +1,159 @@
|
|
|
1
|
+
use datafusion::common::tree_node::{Transformed, TreeNode};
|
|
2
|
+
use datafusion::common::{DataFusionError, Result, ScalarValue};
|
|
3
|
+
use datafusion::logical_expr::expr::{Between, InList};
|
|
4
|
+
use datafusion::logical_expr::{BinaryExpr, Expr, Operator};
|
|
5
|
+
|
|
6
|
+
use crate::common::{normalize_directory_path, ParsedFilePath};
|
|
7
|
+
use crate::LixError;
|
|
8
|
+
|
|
9
|
+
use super::error::lix_error_to_datafusion_error;
|
|
10
|
+
|
|
11
|
+
/// Selects which normalization routine is applied to a path literal found in
/// a filter on the `path` column.
#[derive(Debug, Clone, Copy)]
pub(crate) enum FilesystemPathKind {
    /// Literals are normalized with `ParsedFilePath::try_from_path`.
    File,
    /// Literals are normalized with `normalize_directory_path`.
    Directory,
}
|
|
16
|
+
|
|
17
|
+
pub(crate) fn canonicalize_filesystem_path_filters(
|
|
18
|
+
filters: &[Expr],
|
|
19
|
+
kind: FilesystemPathKind,
|
|
20
|
+
) -> Result<Vec<Expr>> {
|
|
21
|
+
filters
|
|
22
|
+
.iter()
|
|
23
|
+
.cloned()
|
|
24
|
+
.map(|filter| canonicalize_filesystem_path_filter(filter, kind))
|
|
25
|
+
.collect()
|
|
26
|
+
}
|
|
27
|
+
|
|
28
|
+
fn canonicalize_filesystem_path_filter(expr: Expr, kind: FilesystemPathKind) -> Result<Expr> {
|
|
29
|
+
expr.transform(|expr| canonicalize_filesystem_path_expr(expr, kind))
|
|
30
|
+
.map(|transformed| transformed.data)
|
|
31
|
+
}
|
|
32
|
+
|
|
33
|
+
fn canonicalize_filesystem_path_expr(
|
|
34
|
+
expr: Expr,
|
|
35
|
+
kind: FilesystemPathKind,
|
|
36
|
+
) -> Result<Transformed<Expr>> {
|
|
37
|
+
match expr {
|
|
38
|
+
Expr::BinaryExpr(binary_expr) if is_path_comparison_operator(binary_expr.op) => {
|
|
39
|
+
canonicalize_path_binary_expr(binary_expr, kind)
|
|
40
|
+
}
|
|
41
|
+
Expr::InList(in_list) if is_path_column(&in_list.expr) => {
|
|
42
|
+
canonicalize_path_in_list(in_list, kind)
|
|
43
|
+
}
|
|
44
|
+
Expr::Between(between) if is_path_column(&between.expr) => {
|
|
45
|
+
canonicalize_path_between(between, kind)
|
|
46
|
+
}
|
|
47
|
+
_ => Ok(Transformed::no(expr)),
|
|
48
|
+
}
|
|
49
|
+
}
|
|
50
|
+
|
|
51
|
+
fn canonicalize_path_binary_expr(
|
|
52
|
+
binary_expr: BinaryExpr,
|
|
53
|
+
kind: FilesystemPathKind,
|
|
54
|
+
) -> Result<Transformed<Expr>> {
|
|
55
|
+
let BinaryExpr { left, op, right } = binary_expr;
|
|
56
|
+
let left_is_path = is_path_column(&left);
|
|
57
|
+
let right_is_path = is_path_column(&right);
|
|
58
|
+
|
|
59
|
+
let left = if right_is_path {
|
|
60
|
+
Box::new(canonicalize_path_literal_expr(*left, kind)?)
|
|
61
|
+
} else {
|
|
62
|
+
left
|
|
63
|
+
};
|
|
64
|
+
let right = if left_is_path {
|
|
65
|
+
Box::new(canonicalize_path_literal_expr(*right, kind)?)
|
|
66
|
+
} else {
|
|
67
|
+
right
|
|
68
|
+
};
|
|
69
|
+
|
|
70
|
+
Ok(Transformed::yes(Expr::BinaryExpr(BinaryExpr::new(
|
|
71
|
+
left, op, right,
|
|
72
|
+
))))
|
|
73
|
+
}
|
|
74
|
+
|
|
75
|
+
fn canonicalize_path_in_list(
|
|
76
|
+
in_list: InList,
|
|
77
|
+
kind: FilesystemPathKind,
|
|
78
|
+
) -> Result<Transformed<Expr>> {
|
|
79
|
+
let list = in_list
|
|
80
|
+
.list
|
|
81
|
+
.into_iter()
|
|
82
|
+
.map(|expr| canonicalize_path_literal_expr(expr, kind))
|
|
83
|
+
.collect::<Result<Vec<_>>>()?;
|
|
84
|
+
Ok(Transformed::yes(Expr::InList(InList::new(
|
|
85
|
+
in_list.expr,
|
|
86
|
+
list,
|
|
87
|
+
in_list.negated,
|
|
88
|
+
))))
|
|
89
|
+
}
|
|
90
|
+
|
|
91
|
+
fn canonicalize_path_between(
|
|
92
|
+
between: Between,
|
|
93
|
+
kind: FilesystemPathKind,
|
|
94
|
+
) -> Result<Transformed<Expr>> {
|
|
95
|
+
Ok(Transformed::yes(Expr::Between(Between {
|
|
96
|
+
expr: between.expr,
|
|
97
|
+
negated: between.negated,
|
|
98
|
+
low: Box::new(canonicalize_path_literal_expr(*between.low, kind)?),
|
|
99
|
+
high: Box::new(canonicalize_path_literal_expr(*between.high, kind)?),
|
|
100
|
+
})))
|
|
101
|
+
}
|
|
102
|
+
|
|
103
|
+
fn canonicalize_path_literal_expr(expr: Expr, kind: FilesystemPathKind) -> Result<Expr> {
|
|
104
|
+
let Expr::Literal(literal, metadata) = expr else {
|
|
105
|
+
return Err(unsupported_dynamic_path_predicate_error(expr));
|
|
106
|
+
};
|
|
107
|
+
|
|
108
|
+
match literal {
|
|
109
|
+
ScalarValue::Utf8(Some(value))
|
|
110
|
+
| ScalarValue::Utf8View(Some(value))
|
|
111
|
+
| ScalarValue::LargeUtf8(Some(value)) => {
|
|
112
|
+
let normalized = canonicalize_path_value(&value, kind)?;
|
|
113
|
+
Ok(Expr::Literal(ScalarValue::Utf8(Some(normalized)), metadata))
|
|
114
|
+
}
|
|
115
|
+
_ => Ok(Expr::Literal(literal, metadata)),
|
|
116
|
+
}
|
|
117
|
+
}
|
|
118
|
+
|
|
119
|
+
fn canonicalize_path_value(value: &str, kind: FilesystemPathKind) -> Result<String> {
|
|
120
|
+
match kind {
|
|
121
|
+
FilesystemPathKind::File => ParsedFilePath::try_from_path(value)
|
|
122
|
+
.map(|parsed| parsed.normalized_path.to_string())
|
|
123
|
+
.map_err(lix_error_to_datafusion_error),
|
|
124
|
+
FilesystemPathKind::Directory => {
|
|
125
|
+
normalize_directory_path(value).map_err(lix_error_to_datafusion_error)
|
|
126
|
+
}
|
|
127
|
+
}
|
|
128
|
+
}
|
|
129
|
+
|
|
130
|
+
fn is_path_column(expr: &Expr) -> bool {
|
|
131
|
+
matches!(expr, Expr::Column(column) if column.name == "path")
|
|
132
|
+
}
|
|
133
|
+
|
|
134
|
+
fn is_path_comparison_operator(op: Operator) -> bool {
|
|
135
|
+
matches!(
|
|
136
|
+
op,
|
|
137
|
+
Operator::Eq
|
|
138
|
+
| Operator::NotEq
|
|
139
|
+
| Operator::Lt
|
|
140
|
+
| Operator::LtEq
|
|
141
|
+
| Operator::Gt
|
|
142
|
+
| Operator::GtEq
|
|
143
|
+
)
|
|
144
|
+
}
|
|
145
|
+
|
|
146
|
+
fn unsupported_dynamic_path_predicate_error(expr: Expr) -> DataFusionError {
|
|
147
|
+
lix_error_to_datafusion_error(
|
|
148
|
+
LixError::new(
|
|
149
|
+
LixError::CODE_UNSUPPORTED_SQL,
|
|
150
|
+
format!(
|
|
151
|
+
"filesystem path predicates only support literal path values; found expression {expr:?}"
|
|
152
|
+
),
|
|
153
|
+
)
|
|
154
|
+
.with_hint(
|
|
155
|
+
"Compare lix_file.path or lix_directory.path to a string literal or bound parameter. \
|
|
156
|
+
Computed path expressions are not supported until path canonicalization can run at evaluation time.",
|
|
157
|
+
),
|
|
158
|
+
)
|
|
159
|
+
}
|
|
@@ -0,0 +1,383 @@
|
|
|
1
|
+
#![allow(dead_code)]
|
|
2
|
+
|
|
3
|
+
use std::collections::{BTreeMap, BTreeSet};
|
|
4
|
+
use std::sync::Arc;
|
|
5
|
+
|
|
6
|
+
use serde::Deserialize;
|
|
7
|
+
|
|
8
|
+
use crate::live_state::MaterializedLiveStateRow;
|
|
9
|
+
use crate::live_state::{LiveStateFilter, LiveStateReader, LiveStateScanRequest};
|
|
10
|
+
use crate::LixError;
|
|
11
|
+
|
|
12
|
+
use super::filesystem_planner::{
|
|
13
|
+
FilesystemRowContext, BLOB_REF_SCHEMA_KEY, DIRECTORY_DESCRIPTOR_SCHEMA_KEY,
|
|
14
|
+
FILE_DESCRIPTOR_SCHEMA_KEY,
|
|
15
|
+
};
|
|
16
|
+
|
|
17
|
+
/// Execution-visible filesystem metadata decoded from live-state rows.
|
|
18
|
+
///
|
|
19
|
+
/// The helper intentionally depends only on `LiveStateReader`. In engine
|
|
20
|
+
/// write execution that context may include staged rows, so filesystem planning
|
|
21
|
+
/// sees pending writes without reaching into write-execution internals.
|
|
22
|
+
#[derive(Debug, Clone, PartialEq, Eq, Default)]
|
|
23
|
+
pub(crate) struct VisibleFilesystem {
|
|
24
|
+
pub(crate) directories_by_id: BTreeMap<String, VisibleDirectory>,
|
|
25
|
+
pub(crate) directory_children_by_parent_id: BTreeMap<Option<String>, BTreeSet<String>>,
|
|
26
|
+
pub(crate) files_by_directory_id: BTreeMap<Option<String>, BTreeMap<String, VisibleFile>>,
|
|
27
|
+
pub(crate) blob_refs_by_file_id: BTreeMap<String, VisibleBlobRef>,
|
|
28
|
+
}
|
|
29
|
+
|
|
30
|
+
impl VisibleFilesystem {
|
|
31
|
+
/// Loads filesystem rows for a single version from execution-visible live
|
|
32
|
+
/// state and builds lookup indexes used by filesystem write planning.
|
|
33
|
+
pub(crate) async fn load(
|
|
34
|
+
live_state: Arc<dyn LiveStateReader>,
|
|
35
|
+
version_id: &str,
|
|
36
|
+
) -> Result<Self, LixError> {
|
|
37
|
+
let rows = live_state
|
|
38
|
+
.scan_rows(&LiveStateScanRequest {
|
|
39
|
+
filter: LiveStateFilter {
|
|
40
|
+
schema_keys: vec![
|
|
41
|
+
DIRECTORY_DESCRIPTOR_SCHEMA_KEY.to_string(),
|
|
42
|
+
FILE_DESCRIPTOR_SCHEMA_KEY.to_string(),
|
|
43
|
+
BLOB_REF_SCHEMA_KEY.to_string(),
|
|
44
|
+
],
|
|
45
|
+
version_ids: vec![version_id.to_string()],
|
|
46
|
+
..LiveStateFilter::default()
|
|
47
|
+
},
|
|
48
|
+
..LiveStateScanRequest::default()
|
|
49
|
+
})
|
|
50
|
+
.await?;
|
|
51
|
+
Self::from_live_rows(rows)
|
|
52
|
+
}
|
|
53
|
+
|
|
54
|
+
/// Builds filesystem lookup indexes from rows that are already known to be
|
|
55
|
+
/// transaction-visible.
|
|
56
|
+
pub(crate) fn from_live_rows(rows: Vec<MaterializedLiveStateRow>) -> Result<Self, LixError> {
|
|
57
|
+
let mut visible = Self::default();
|
|
58
|
+
|
|
59
|
+
for row in rows {
|
|
60
|
+
let Some(snapshot_content) = row.snapshot_content.as_deref() else {
|
|
61
|
+
continue;
|
|
62
|
+
};
|
|
63
|
+
match row.schema_key.as_str() {
|
|
64
|
+
DIRECTORY_DESCRIPTOR_SCHEMA_KEY => {
|
|
65
|
+
let snapshot: DirectoryDescriptorSnapshot =
|
|
66
|
+
serde_json::from_str(snapshot_content).map_err(|error| {
|
|
67
|
+
LixError::new(
|
|
68
|
+
"LIX_ERROR_UNKNOWN",
|
|
69
|
+
format!("invalid lix_directory_descriptor snapshot JSON: {error}"),
|
|
70
|
+
)
|
|
71
|
+
})?;
|
|
72
|
+
let directory = VisibleDirectory {
|
|
73
|
+
id: snapshot.id,
|
|
74
|
+
parent_id: snapshot.parent_id,
|
|
75
|
+
name: snapshot.name,
|
|
76
|
+
hidden: snapshot.hidden.unwrap_or(false),
|
|
77
|
+
context: filesystem_row_context(&row)?,
|
|
78
|
+
};
|
|
79
|
+
visible
|
|
80
|
+
.directory_children_by_parent_id
|
|
81
|
+
.entry(directory.parent_id.clone())
|
|
82
|
+
.or_default()
|
|
83
|
+
.insert(directory.id.clone());
|
|
84
|
+
visible
|
|
85
|
+
.directories_by_id
|
|
86
|
+
.insert(directory.id.clone(), directory);
|
|
87
|
+
}
|
|
88
|
+
FILE_DESCRIPTOR_SCHEMA_KEY => {
|
|
89
|
+
let snapshot: FileDescriptorSnapshot = serde_json::from_str(snapshot_content)
|
|
90
|
+
.map_err(|error| {
|
|
91
|
+
LixError::new(
|
|
92
|
+
"LIX_ERROR_UNKNOWN",
|
|
93
|
+
format!("invalid lix_file_descriptor snapshot JSON: {error}"),
|
|
94
|
+
)
|
|
95
|
+
})?;
|
|
96
|
+
let file = VisibleFile {
|
|
97
|
+
id: snapshot.id,
|
|
98
|
+
directory_id: snapshot.directory_id,
|
|
99
|
+
name: snapshot.name,
|
|
100
|
+
hidden: snapshot.hidden,
|
|
101
|
+
context: filesystem_row_context(&row)?,
|
|
102
|
+
};
|
|
103
|
+
visible
|
|
104
|
+
.files_by_directory_id
|
|
105
|
+
.entry(file.directory_id.clone())
|
|
106
|
+
.or_default()
|
|
107
|
+
.insert(file.id.clone(), file);
|
|
108
|
+
}
|
|
109
|
+
BLOB_REF_SCHEMA_KEY => {
|
|
110
|
+
let snapshot: BlobRefSnapshot = serde_json::from_str(snapshot_content)
|
|
111
|
+
.map_err(|error| {
|
|
112
|
+
LixError::new(
|
|
113
|
+
"LIX_ERROR_UNKNOWN",
|
|
114
|
+
format!("invalid lix_binary_blob_ref snapshot JSON: {error}"),
|
|
115
|
+
)
|
|
116
|
+
})?;
|
|
117
|
+
visible.blob_refs_by_file_id.insert(
|
|
118
|
+
snapshot.id.clone(),
|
|
119
|
+
VisibleBlobRef {
|
|
120
|
+
file_id: snapshot.id,
|
|
121
|
+
blob_hash: snapshot.blob_hash,
|
|
122
|
+
size_bytes: snapshot.size_bytes,
|
|
123
|
+
context: filesystem_row_context(&row)?,
|
|
124
|
+
},
|
|
125
|
+
);
|
|
126
|
+
}
|
|
127
|
+
_ => {}
|
|
128
|
+
}
|
|
129
|
+
}
|
|
130
|
+
|
|
131
|
+
Ok(visible)
|
|
132
|
+
}
|
|
133
|
+
}
|
|
134
|
+
|
|
135
|
+
#[derive(Debug, Clone, PartialEq, Eq)]
|
|
136
|
+
pub(crate) struct VisibleDirectory {
|
|
137
|
+
pub(crate) id: String,
|
|
138
|
+
pub(crate) parent_id: Option<String>,
|
|
139
|
+
pub(crate) name: String,
|
|
140
|
+
pub(crate) hidden: bool,
|
|
141
|
+
pub(crate) context: FilesystemRowContext,
|
|
142
|
+
}
|
|
143
|
+
|
|
144
|
+
#[derive(Debug, Clone, PartialEq, Eq)]
|
|
145
|
+
pub(crate) struct VisibleFile {
|
|
146
|
+
pub(crate) id: String,
|
|
147
|
+
pub(crate) directory_id: Option<String>,
|
|
148
|
+
pub(crate) name: String,
|
|
149
|
+
pub(crate) hidden: bool,
|
|
150
|
+
pub(crate) context: FilesystemRowContext,
|
|
151
|
+
}
|
|
152
|
+
|
|
153
|
+
#[derive(Debug, Clone, PartialEq, Eq)]
|
|
154
|
+
pub(crate) struct VisibleBlobRef {
|
|
155
|
+
pub(crate) file_id: String,
|
|
156
|
+
pub(crate) blob_hash: String,
|
|
157
|
+
pub(crate) size_bytes: Option<u64>,
|
|
158
|
+
pub(crate) context: FilesystemRowContext,
|
|
159
|
+
}
|
|
160
|
+
|
|
161
|
+
#[derive(Debug, Deserialize)]
|
|
162
|
+
struct DirectoryDescriptorSnapshot {
|
|
163
|
+
id: String,
|
|
164
|
+
parent_id: Option<String>,
|
|
165
|
+
name: String,
|
|
166
|
+
hidden: Option<bool>,
|
|
167
|
+
}
|
|
168
|
+
|
|
169
|
+
#[derive(Debug, Deserialize)]
|
|
170
|
+
struct FileDescriptorSnapshot {
|
|
171
|
+
id: String,
|
|
172
|
+
directory_id: Option<String>,
|
|
173
|
+
name: String,
|
|
174
|
+
hidden: bool,
|
|
175
|
+
}
|
|
176
|
+
|
|
177
|
+
#[derive(Debug, Deserialize)]
|
|
178
|
+
struct BlobRefSnapshot {
|
|
179
|
+
id: String,
|
|
180
|
+
blob_hash: String,
|
|
181
|
+
size_bytes: Option<u64>,
|
|
182
|
+
}
|
|
183
|
+
|
|
184
|
+
fn filesystem_row_context(
|
|
185
|
+
row: &MaterializedLiveStateRow,
|
|
186
|
+
) -> Result<FilesystemRowContext, LixError> {
|
|
187
|
+
Ok(FilesystemRowContext {
|
|
188
|
+
version_id: row.version_id.clone(),
|
|
189
|
+
global: row.global,
|
|
190
|
+
untracked: row.untracked,
|
|
191
|
+
file_id: row.file_id.clone(),
|
|
192
|
+
metadata: row
|
|
193
|
+
.metadata
|
|
194
|
+
.as_deref()
|
|
195
|
+
.map(|metadata| {
|
|
196
|
+
crate::parse_row_metadata_value(metadata, "filesystem row metadata").and_then(
|
|
197
|
+
|metadata| {
|
|
198
|
+
crate::transaction::types::TransactionJson::from_value(
|
|
199
|
+
metadata,
|
|
200
|
+
"filesystem row metadata",
|
|
201
|
+
)
|
|
202
|
+
},
|
|
203
|
+
)
|
|
204
|
+
})
|
|
205
|
+
.transpose()?,
|
|
206
|
+
})
|
|
207
|
+
}
|
|
208
|
+
|
|
209
|
+
#[cfg(test)]
mod tests {
    use async_trait::async_trait;

    use crate::live_state::MaterializedLiveStateRow;
    use crate::live_state::{LiveStateReader, LiveStateRowRequest, LiveStateScanRequest};
    use crate::LixError;

    use super::{
        VisibleFilesystem, BLOB_REF_SCHEMA_KEY, DIRECTORY_DESCRIPTOR_SCHEMA_KEY,
        FILE_DESCRIPTOR_SCHEMA_KEY,
    };

    /// Parent/child links are recorded both on the directory itself and in
    /// the children index (top-level directories sit under `None`).
    #[tokio::test]
    async fn nested_directories_resolve_correctly() {
        let rows = vec![
            directory_row(
                "dir-docs",
                r#"{"id":"dir-docs","parent_id":null,"name":"docs","hidden":false}"#,
            ),
            directory_row(
                "dir-guides",
                r#"{"id":"dir-guides","parent_id":"dir-docs","name":"guides","hidden":false}"#,
            ),
        ];
        let filesystem = VisibleFilesystem::load(live_state(rows), "version-a")
            .await
            .expect("visible filesystem should load");

        let guides_parent = filesystem
            .directories_by_id
            .get("dir-guides")
            .and_then(|directory| directory.parent_id.as_deref());
        assert_eq!(guides_parent, Some("dir-docs"));

        let top_level = filesystem.directory_children_by_parent_id.get(&None);
        assert!(top_level.is_some_and(|children| children.contains("dir-docs")));

        let under_docs = filesystem
            .directory_children_by_parent_id
            .get(&Some("dir-docs".to_string()));
        assert!(under_docs.is_some_and(|children| children.contains("dir-guides")));
    }

    /// Files are grouped under the directory id named in their snapshot.
    #[tokio::test]
    async fn files_attach_to_directory_ids() {
        let rows = vec![file_row(
            "file-readme",
            r#"{"id":"file-readme","directory_id":"dir-guides","name":"readme.md","hidden":false}"#,
        )];
        let filesystem = VisibleFilesystem::load(live_state(rows), "version-a")
            .await
            .expect("visible filesystem should load");

        let files = filesystem
            .files_by_directory_id
            .get(&Some("dir-guides".to_string()))
            .expect("directory should have attached files");
        let file = files
            .get("file-readme")
            .expect("file should be indexed by id inside directory");
        assert_eq!(file.name, "readme.md");
    }

    /// Blob refs are keyed by the id carried in their snapshot.
    #[tokio::test]
    async fn blob_refs_attach_to_file_ids() {
        let rows = vec![blob_ref_row(
            "file-readme",
            r#"{"id":"file-readme","blob_hash":"abc123","size_bytes":5}"#,
        )];
        let filesystem = VisibleFilesystem::load(live_state(rows), "version-a")
            .await
            .expect("visible filesystem should load");

        let blob_ref = filesystem
            .blob_refs_by_file_id
            .get("file-readme")
            .expect("blob ref should be indexed by file id");
        assert_eq!(blob_ref.blob_hash, "abc123");
        assert_eq!(blob_ref.size_bytes, Some(5));
    }

    /// Wraps fixture rows in an in-memory reader.
    fn live_state(rows: Vec<MaterializedLiveStateRow>) -> std::sync::Arc<dyn LiveStateReader> {
        let reader = RowsLiveStateReader { rows };
        std::sync::Arc::new(reader)
    }

    /// In-memory `LiveStateReader` backed by a fixed list of rows.
    struct RowsLiveStateReader {
        rows: Vec<MaterializedLiveStateRow>,
    }

    #[async_trait]
    impl LiveStateReader for RowsLiveStateReader {
        /// Returns the rows matching the request's schema-key and version-id
        /// filters; an empty filter list matches everything.
        async fn scan_rows(
            &self,
            request: &LiveStateScanRequest,
        ) -> Result<Vec<MaterializedLiveStateRow>, LixError> {
            let filter = &request.filter;
            let matching = self
                .rows
                .iter()
                .filter(|row| {
                    let schema_matches = filter.schema_keys.is_empty()
                        || filter.schema_keys.contains(&row.schema_key);
                    let version_matches = filter.version_ids.is_empty()
                        || filter.version_ids.contains(&row.version_id);
                    schema_matches && version_matches
                })
                .cloned()
                .collect();
            Ok(matching)
        }

        /// Point lookups are not needed by these tests.
        async fn load_row(
            &self,
            _request: &LiveStateRowRequest,
        ) -> Result<Option<MaterializedLiveStateRow>, LixError> {
            Ok(None)
        }
    }

    fn directory_row(entity_id: &str, snapshot_content: &str) -> MaterializedLiveStateRow {
        let file_id = None;
        live_row(
            entity_id,
            DIRECTORY_DESCRIPTOR_SCHEMA_KEY,
            file_id,
            snapshot_content,
        )
    }

    fn file_row(entity_id: &str, snapshot_content: &str) -> MaterializedLiveStateRow {
        let file_id = None;
        live_row(
            entity_id,
            FILE_DESCRIPTOR_SCHEMA_KEY,
            file_id,
            snapshot_content,
        )
    }

    fn blob_ref_row(entity_id: &str, snapshot_content: &str) -> MaterializedLiveStateRow {
        let file_id = Some(entity_id.to_string());
        live_row(entity_id, BLOB_REF_SCHEMA_KEY, file_id, snapshot_content)
    }

    /// Builds a tracked, non-global, non-deleted fixture row in `version-a`.
    fn live_row(
        entity_id: &str,
        schema_key: &str,
        file_id: Option<String>,
        snapshot_content: &str,
    ) -> MaterializedLiveStateRow {
        let change_id = format!("change-{entity_id}");
        let commit_id = format!("commit-{entity_id}");

        MaterializedLiveStateRow {
            entity_id: crate::entity_identity::EntityIdentity::single(entity_id),
            schema_key: schema_key.to_string(),
            file_id,
            snapshot_content: Some(snapshot_content.to_string()),
            metadata: None,
            deleted: false,
            version_id: "version-a".to_string(),
            change_id: Some(change_id),
            commit_id: Some(commit_id),
            global: false,
            untracked: false,
            created_at: "2026-04-23T00:00:00Z".to_string(),
            updated_at: "2026-04-23T01:00:00Z".to_string(),
        }
    }
}
|
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
use serde_json::Value as JsonValue;
|
|
2
|
+
|
|
3
|
+
use crate::entity_identity::EntityIdentity;
|
|
4
|
+
use crate::LixError;
|
|
5
|
+
|
|
6
|
+
/// Projection contract shared by the typed history views.
///
/// A tombstone row (`snapshot_content IS NULL`) has no snapshot to read
/// payload from, so its non-identity columns must stay NULL. Identity columns
/// survive because they are projected from the canonical entity identity.
pub(crate) enum HistoryIdentityProjection<'a> {
    /// Identity parts map onto columns by position in this list of
    /// primary-key paths; only single-segment paths can name a column.
    PrimaryKeyPaths(&'a [Vec<String>]),
    /// The entity id as a whole is projected into the named column.
    SingleColumn { column: &'a str },
}
|
|
15
|
+
|
|
16
|
+
pub(crate) fn tombstone_identity_column_value(
|
|
17
|
+
column_name: &str,
|
|
18
|
+
entity_id: &str,
|
|
19
|
+
projection: HistoryIdentityProjection<'_>,
|
|
20
|
+
) -> Result<Option<JsonValue>, LixError> {
|
|
21
|
+
match projection {
|
|
22
|
+
HistoryIdentityProjection::SingleColumn { column } => {
|
|
23
|
+
if column_name == column {
|
|
24
|
+
Ok(Some(JsonValue::String(entity_id.to_string())))
|
|
25
|
+
} else {
|
|
26
|
+
Ok(None)
|
|
27
|
+
}
|
|
28
|
+
}
|
|
29
|
+
HistoryIdentityProjection::PrimaryKeyPaths(primary_key_paths) => {
|
|
30
|
+
primary_key_tombstone_value(column_name, entity_id, primary_key_paths)
|
|
31
|
+
}
|
|
32
|
+
}
|
|
33
|
+
}
|
|
34
|
+
|
|
35
|
+
fn primary_key_tombstone_value(
|
|
36
|
+
column_name: &str,
|
|
37
|
+
entity_id: &str,
|
|
38
|
+
primary_key_paths: &[Vec<String>],
|
|
39
|
+
) -> Result<Option<JsonValue>, LixError> {
|
|
40
|
+
let Some(part_index) = primary_key_paths
|
|
41
|
+
.iter()
|
|
42
|
+
.position(|path| path.as_slice() == [column_name])
|
|
43
|
+
else {
|
|
44
|
+
return Ok(None);
|
|
45
|
+
};
|
|
46
|
+
|
|
47
|
+
let identity = EntityIdentity::from_json_array_text(entity_id).map_err(|error| {
|
|
48
|
+
LixError::unknown(format!(
|
|
49
|
+
"failed to decode history tombstone entity identity: {error}"
|
|
50
|
+
))
|
|
51
|
+
})?;
|
|
52
|
+
Ok(identity
|
|
53
|
+
.parts
|
|
54
|
+
.get(part_index)
|
|
55
|
+
.map(|part| JsonValue::String(part.clone())))
|
|
56
|
+
}
|