@lix-js/sdk 0.6.0-preview.2 → 0.6.0-preview.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (169) hide show
  1. package/SKILL.md +46 -8
  2. package/dist/engine-wasm/wasm/lix_engine.d.ts +25 -1
  3. package/dist/engine-wasm/wasm/lix_engine.js +60 -2
  4. package/dist/engine-wasm/wasm/lix_engine.wasm +0 -0
  5. package/dist/engine-wasm/wasm/lix_engine.wasm.d.ts +5 -0
  6. package/dist/generated/builtin-schemas.d.ts +87 -162
  7. package/dist/generated/builtin-schemas.js +139 -236
  8. package/dist/open-lix.d.ts +10 -3
  9. package/dist/open-lix.js +39 -0
  10. package/dist-engine-src/src/binary_cas/types.rs +0 -6
  11. package/dist-engine-src/src/catalog/context.rs +412 -0
  12. package/dist-engine-src/src/catalog/mod.rs +10 -0
  13. package/dist-engine-src/src/catalog/schema.rs +4 -0
  14. package/dist-engine-src/src/catalog/snapshot.rs +1114 -0
  15. package/dist-engine-src/src/cel/mod.rs +1 -1
  16. package/dist-engine-src/src/cel/provider.rs +1 -1
  17. package/dist-engine-src/src/commit_graph/context.rs +328 -1015
  18. package/dist-engine-src/src/commit_graph/mod.rs +2 -3
  19. package/dist-engine-src/src/commit_graph/types.rs +7 -43
  20. package/dist-engine-src/src/commit_graph/walker.rs +57 -81
  21. package/dist-engine-src/src/commit_store/codec.rs +887 -0
  22. package/dist-engine-src/src/commit_store/context.rs +944 -0
  23. package/dist-engine-src/src/commit_store/materialization.rs +84 -0
  24. package/dist-engine-src/src/commit_store/mod.rs +16 -0
  25. package/dist-engine-src/src/commit_store/storage.rs +600 -0
  26. package/dist-engine-src/src/commit_store/types.rs +215 -0
  27. package/dist-engine-src/src/common/identity.rs +15 -5
  28. package/dist-engine-src/src/common/json_pointer.rs +67 -0
  29. package/dist-engine-src/src/common/metadata.rs +17 -12
  30. package/dist-engine-src/src/common/mod.rs +5 -5
  31. package/dist-engine-src/src/domain.rs +324 -0
  32. package/dist-engine-src/src/engine.rs +29 -43
  33. package/dist-engine-src/src/entity_identity.rs +238 -118
  34. package/dist-engine-src/src/functions/context.rs +17 -52
  35. package/dist-engine-src/src/functions/deterministic.rs +1 -1
  36. package/dist-engine-src/src/functions/mod.rs +1 -1
  37. package/dist-engine-src/src/functions/provider.rs +4 -4
  38. package/dist-engine-src/src/functions/state.rs +39 -66
  39. package/dist-engine-src/src/functions/types.rs +1 -1
  40. package/dist-engine-src/src/init.rs +204 -151
  41. package/dist-engine-src/src/json_store/context.rs +354 -60
  42. package/dist-engine-src/src/json_store/encoded.rs +6 -6
  43. package/dist-engine-src/src/json_store/mod.rs +4 -1
  44. package/dist-engine-src/src/json_store/store.rs +884 -11
  45. package/dist-engine-src/src/json_store/types.rs +166 -1
  46. package/dist-engine-src/src/lib.rs +11 -10
  47. package/dist-engine-src/src/live_state/context.rs +608 -830
  48. package/dist-engine-src/src/live_state/mod.rs +3 -3
  49. package/dist-engine-src/src/live_state/overlay.rs +7 -7
  50. package/dist-engine-src/src/live_state/reader.rs +5 -5
  51. package/dist-engine-src/src/live_state/types.rs +19 -36
  52. package/dist-engine-src/src/live_state/visibility.rs +19 -14
  53. package/dist-engine-src/src/plugin/archive.rs +3 -6
  54. package/dist-engine-src/src/plugin/install.rs +0 -18
  55. package/dist-engine-src/src/plugin/plugin_manifest.json +0 -1
  56. package/dist-engine-src/src/schema/annotations/defaults.rs +2 -7
  57. package/dist-engine-src/src/schema/builtin/lix_account.json +0 -1
  58. package/dist-engine-src/src/schema/builtin/lix_active_account.json +0 -1
  59. package/dist-engine-src/src/schema/builtin/lix_binary_blob_ref.json +0 -1
  60. package/dist-engine-src/src/schema/builtin/lix_change.json +11 -10
  61. package/dist-engine-src/src/schema/builtin/lix_change_author.json +0 -1
  62. package/dist-engine-src/src/schema/builtin/lix_commit.json +8 -46
  63. package/dist-engine-src/src/schema/builtin/lix_commit_edge.json +29 -22
  64. package/dist-engine-src/src/schema/builtin/lix_directory_descriptor.json +0 -1
  65. package/dist-engine-src/src/schema/builtin/lix_file_descriptor.json +0 -1
  66. package/dist-engine-src/src/schema/builtin/lix_key_value.json +0 -1
  67. package/dist-engine-src/src/schema/builtin/lix_label.json +10 -3
  68. package/dist-engine-src/src/schema/builtin/lix_label_assignment.json +74 -0
  69. package/dist-engine-src/src/schema/builtin/lix_registered_schema.json +2 -8
  70. package/dist-engine-src/src/schema/builtin/lix_version_descriptor.json +0 -1
  71. package/dist-engine-src/src/schema/builtin/lix_version_ref.json +0 -1
  72. package/dist-engine-src/src/schema/builtin/mod.rs +10 -59
  73. package/dist-engine-src/src/schema/compatibility.rs +787 -0
  74. package/dist-engine-src/src/schema/definition.json +47 -17
  75. package/dist-engine-src/src/schema/definition.rs +202 -96
  76. package/dist-engine-src/src/schema/key.rs +9 -77
  77. package/dist-engine-src/src/schema/mod.rs +4 -4
  78. package/dist-engine-src/src/schema/tests.rs +133 -92
  79. package/dist-engine-src/src/session/context.rs +86 -48
  80. package/dist-engine-src/src/session/create_version.rs +22 -14
  81. package/dist-engine-src/src/session/execute.rs +117 -23
  82. package/dist-engine-src/src/session/merge/apply.rs +4 -4
  83. package/dist-engine-src/src/session/merge/conflicts.rs +3 -2
  84. package/dist-engine-src/src/session/merge/stats.rs +1 -1
  85. package/dist-engine-src/src/session/merge/version.rs +35 -45
  86. package/dist-engine-src/src/session/mod.rs +9 -7
  87. package/dist-engine-src/src/session/optimization9_sql2_bench.rs +100 -0
  88. package/dist-engine-src/src/session/switch_version.rs +17 -28
  89. package/dist-engine-src/src/session/transaction.rs +76 -0
  90. package/dist-engine-src/src/sql2/change_provider.rs +14 -20
  91. package/dist-engine-src/src/sql2/classify.rs +75 -48
  92. package/dist-engine-src/src/sql2/context.rs +22 -18
  93. package/dist-engine-src/src/sql2/directory_history_provider.rs +28 -20
  94. package/dist-engine-src/src/sql2/directory_provider.rs +131 -83
  95. package/dist-engine-src/src/sql2/entity_history_provider.rs +10 -14
  96. package/dist-engine-src/src/sql2/entity_provider.rs +680 -169
  97. package/dist-engine-src/src/sql2/error.rs +24 -5
  98. package/dist-engine-src/src/sql2/execute.rs +426 -272
  99. package/dist-engine-src/src/sql2/file_history_provider.rs +29 -21
  100. package/dist-engine-src/src/sql2/file_provider.rs +533 -108
  101. package/dist-engine-src/src/sql2/filesystem_planner.rs +58 -94
  102. package/dist-engine-src/src/sql2/filesystem_visibility.rs +37 -23
  103. package/dist-engine-src/src/sql2/history_projection.rs +3 -27
  104. package/dist-engine-src/src/sql2/history_provider.rs +11 -17
  105. package/dist-engine-src/src/sql2/history_route.rs +22 -8
  106. package/dist-engine-src/src/sql2/lix_state_provider.rs +178 -96
  107. package/dist-engine-src/src/sql2/mod.rs +8 -4
  108. package/dist-engine-src/src/sql2/predicate_typecheck.rs +246 -0
  109. package/dist-engine-src/src/sql2/public_bind/assignment.rs +46 -0
  110. package/dist-engine-src/src/sql2/public_bind/capability.rs +41 -0
  111. package/dist-engine-src/src/sql2/public_bind/dml.rs +172 -0
  112. package/dist-engine-src/src/sql2/public_bind/mod.rs +26 -0
  113. package/dist-engine-src/src/sql2/public_bind/table.rs +168 -0
  114. package/dist-engine-src/src/sql2/read_only.rs +10 -12
  115. package/dist-engine-src/src/sql2/session.rs +7 -10
  116. package/dist-engine-src/src/sql2/udfs/lix_timestamp.rs +76 -0
  117. package/dist-engine-src/src/sql2/udfs/mod.rs +8 -1
  118. package/dist-engine-src/src/sql2/udfs/public_call.rs +238 -0
  119. package/dist-engine-src/src/sql2/version_provider.rs +46 -31
  120. package/dist-engine-src/src/sql2/version_scope.rs +4 -4
  121. package/dist-engine-src/src/storage_bench.rs +1782 -325
  122. package/dist-engine-src/src/test_support.rs +183 -36
  123. package/dist-engine-src/src/tracked_state/by_file_index.rs +20 -24
  124. package/dist-engine-src/src/tracked_state/codec.rs +1519 -181
  125. package/dist-engine-src/src/tracked_state/context.rs +1155 -271
  126. package/dist-engine-src/src/tracked_state/diff.rs +249 -57
  127. package/dist-engine-src/src/tracked_state/materialization.rs +365 -103
  128. package/dist-engine-src/src/tracked_state/materializer.rs +488 -0
  129. package/dist-engine-src/src/tracked_state/merge.rs +37 -19
  130. package/dist-engine-src/src/tracked_state/mod.rs +8 -7
  131. package/dist-engine-src/src/tracked_state/storage.rs +138 -6
  132. package/dist-engine-src/src/tracked_state/tree.rs +695 -252
  133. package/dist-engine-src/src/tracked_state/types.rs +176 -6
  134. package/dist-engine-src/src/transaction/commit.rs +695 -435
  135. package/dist-engine-src/src/transaction/context.rs +551 -310
  136. package/dist-engine-src/src/transaction/live_state_overlay.rs +9 -8
  137. package/dist-engine-src/src/transaction/mod.rs +2 -0
  138. package/dist-engine-src/src/transaction/normalization.rs +311 -447
  139. package/dist-engine-src/src/transaction/prep.rs +37 -0
  140. package/dist-engine-src/src/transaction/schema_resolver.rs +93 -71
  141. package/dist-engine-src/src/transaction/staging.rs +701 -406
  142. package/dist-engine-src/src/transaction/types.rs +231 -122
  143. package/dist-engine-src/src/transaction/validation.rs +2717 -1698
  144. package/dist-engine-src/src/untracked_state/codec.rs +40 -96
  145. package/dist-engine-src/src/untracked_state/context.rs +21 -5
  146. package/dist-engine-src/src/untracked_state/materialization.rs +10 -104
  147. package/dist-engine-src/src/untracked_state/mod.rs +3 -5
  148. package/dist-engine-src/src/untracked_state/storage.rs +105 -57
  149. package/dist-engine-src/src/untracked_state/types.rs +63 -13
  150. package/dist-engine-src/src/version/context.rs +1 -13
  151. package/dist-engine-src/src/version/lifecycle.rs +221 -0
  152. package/dist-engine-src/src/version/mod.rs +3 -2
  153. package/dist-engine-src/src/version/refs.rs +12 -103
  154. package/dist-engine-src/src/version/stage_rows.rs +15 -19
  155. package/package.json +1 -1
  156. package/dist-engine-src/src/changelog/codec.rs +0 -321
  157. package/dist-engine-src/src/changelog/context.rs +0 -92
  158. package/dist-engine-src/src/changelog/materialization.rs +0 -121
  159. package/dist-engine-src/src/changelog/mod.rs +0 -13
  160. package/dist-engine-src/src/changelog/reader.rs +0 -20
  161. package/dist-engine-src/src/changelog/storage.rs +0 -220
  162. package/dist-engine-src/src/changelog/types.rs +0 -38
  163. package/dist-engine-src/src/schema/builtin/lix_change_set.json +0 -18
  164. package/dist-engine-src/src/schema/builtin/lix_change_set_element.json +0 -75
  165. package/dist-engine-src/src/schema/builtin/lix_entity_label.json +0 -63
  166. package/dist-engine-src/src/schema_registry.rs +0 -294
  167. package/dist-engine-src/src/sql2/commit_derived_provider.rs +0 -591
  168. package/dist-engine-src/src/tracked_state/rebuild.rs +0 -771
  169. package/dist-engine-src/src/tracked_state/tree_types.rs +0 -176
@@ -0,0 +1,168 @@
1
+ use std::collections::{BTreeMap, BTreeSet};
2
+
3
+ use serde_json::Value as JsonValue;
4
+
5
+ use crate::schema::schema_key_from_definition;
6
+ use crate::LixError;
7
+
8
/// Outcome of asking whether a DML operation may run against a public table
/// surface.
///
/// The `&'static str` carried by the non-`Allowed` variants is the explanatory
/// message stored alongside the contract.
#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub(crate) enum Capability {
    /// The operation is permitted.
    Allowed,
    /// The surface is read-only for this operation; the payload explains why.
    ReadOnly(&'static str),
    /// The operation is not supported on this surface; the payload explains why.
    Unsupported(&'static str),
}
14
+
15
/// Write contract for a single column of a public table surface.
#[derive(Clone, Debug)]
pub(crate) struct ColumnContract {
    /// `true` when the column may be written.
    pub(crate) writable: bool,
}
19
+
20
+ #[derive(Clone, Debug)]
21
+ pub(crate) struct TableContract {
22
+ pub(crate) insert: Capability,
23
+ pub(crate) update: Capability,
24
+ pub(crate) delete: Capability,
25
+ pub(crate) columns: BTreeMap<String, ColumnContract>,
26
+ }
27
+
28
+ impl TableContract {
29
+ pub(crate) fn operation(&self, operation: super::DmlOperation) -> Capability {
30
+ match operation {
31
+ super::DmlOperation::Insert => self.insert,
32
+ super::DmlOperation::Update => self.update,
33
+ super::DmlOperation::Delete => self.delete,
34
+ }
35
+ }
36
+
37
+ pub(crate) fn column(&self, column: &str) -> Option<&ColumnContract> {
38
+ self.columns.get(column)
39
+ }
40
+ }
41
+
42
/// Name of a public SQL surface, normalized to ASCII lowercase so that
/// lookups are case-insensitive for ASCII identifiers.
#[derive(Clone, Debug, Eq, PartialEq, Ord, PartialOrd)]
pub(crate) struct PublicSurface {
    name: String,
}

impl PublicSurface {
    /// Builds a surface from `name`, lowercasing its ASCII letters.
    ///
    /// Non-ASCII characters are left untouched.
    pub(crate) fn named(name: impl Into<String>) -> Self {
        let mut name: String = name.into();
        // Lowercase in place: reuses the buffer we already own instead of
        // allocating a second string.
        name.make_ascii_lowercase();
        Self { name }
    }

    /// Returns the normalized (ASCII-lowercased) surface name.
    pub(crate) fn name(&self) -> &str {
        self.name.as_str()
    }
}
58
+
59
+ #[derive(Clone, Debug)]
60
+ pub(crate) struct PublicTableContracts {
61
+ contracts: BTreeMap<String, TableContract>,
62
+ }
63
+
64
+ impl PublicTableContracts {
65
+ pub(crate) fn new(visible_schemas: &[JsonValue]) -> Result<Self, LixError> {
66
+ let mut contracts = builtin_contracts();
67
+ for schema in visible_schemas {
68
+ let schema_key = schema_key_from_definition(schema)?.schema_key;
69
+ contracts.insert(
70
+ format!("{}_history", schema_key.to_ascii_lowercase()),
71
+ history_contract(),
72
+ );
73
+ }
74
+ Ok(Self { contracts })
75
+ }
76
+
77
+ pub(crate) fn get(&self, surface: &PublicSurface) -> Option<&TableContract> {
78
+ self.contracts.get(surface.name())
79
+ }
80
+ }
81
+
82
+ fn builtin_contracts() -> BTreeMap<String, TableContract> {
83
+ let mut contracts = BTreeMap::new();
84
+
85
+ for table in [
86
+ "lix_change",
87
+ "lix_commit",
88
+ "lix_commit_by_version",
89
+ "lix_commit_edge",
90
+ "lix_commit_edge_by_version",
91
+ "lix_change_set",
92
+ "lix_change_set_by_version",
93
+ "lix_change_set_element",
94
+ "lix_change_set_element_by_version",
95
+ ] {
96
+ contracts.insert(table.to_string(), commit_graph_contract());
97
+ }
98
+
99
+ for table in [
100
+ "lix_state_history",
101
+ "lix_file_history",
102
+ "lix_directory_history",
103
+ ] {
104
+ contracts.insert(table.to_string(), history_contract());
105
+ }
106
+
107
+ contracts.insert(
108
+ "lix_registered_schema".to_string(),
109
+ TableContract {
110
+ insert: Capability::Allowed,
111
+ update: Capability::Allowed,
112
+ delete: Capability::Unsupported(
113
+ "lix_registered_schema deletion is not supported; register an amended schema instead",
114
+ ),
115
+ columns: columns(&["value", "lixcol_metadata", "lixcol_global", "lixcol_untracked"]),
116
+ },
117
+ );
118
+
119
+ contracts.insert(
120
+ "lix_key_value".to_string(),
121
+ TableContract {
122
+ insert: Capability::Allowed,
123
+ update: Capability::Allowed,
124
+ delete: Capability::Allowed,
125
+ columns: columns(&["key", "value", "lixcol_metadata"]),
126
+ },
127
+ );
128
+
129
+ contracts
130
+ }
131
+
132
+ fn commit_graph_contract() -> TableContract {
133
+ TableContract {
134
+ insert: Capability::ReadOnly(
135
+ "Commit graph and changelog surfaces are read-only; Lix creates them when transactions commit.",
136
+ ),
137
+ update: Capability::ReadOnly(
138
+ "Commit graph and changelog surfaces are read-only; Lix creates them when transactions commit.",
139
+ ),
140
+ delete: Capability::ReadOnly(
141
+ "Commit graph and changelog surfaces are read-only; Lix creates them when transactions commit.",
142
+ ),
143
+ columns: BTreeMap::new(),
144
+ }
145
+ }
146
+
147
+ fn history_contract() -> TableContract {
148
+ TableContract {
149
+ insert: Capability::ReadOnly(
150
+ "History views are query-only; write to the live surface such as lix_state, lix_file, lix_directory, or the typed entity table.",
151
+ ),
152
+ update: Capability::ReadOnly(
153
+ "History views are query-only; write to the live surface such as lix_state, lix_file, lix_directory, or the typed entity table.",
154
+ ),
155
+ delete: Capability::ReadOnly(
156
+ "History views are query-only; write to the live surface such as lix_state, lix_file, lix_directory, or the typed entity table.",
157
+ ),
158
+ columns: BTreeMap::new(),
159
+ }
160
+ }
161
+
162
+ fn columns(writable: &[&str]) -> BTreeMap<String, ColumnContract> {
163
+ let writable = writable.iter().copied().collect::<BTreeSet<_>>();
164
+ writable
165
+ .into_iter()
166
+ .map(|column| (column.to_string(), ColumnContract { writable: true }))
167
+ .collect()
168
+ }
@@ -1,42 +1,42 @@
1
1
  use datafusion::error::DataFusionError;
2
2
 
3
- use crate::transaction::types::StageRow;
3
+ use crate::transaction::types::TransactionWriteRow;
4
4
  use crate::LixError;
5
5
 
6
6
  pub(crate) fn reject_read_only_entity_surface(
7
7
  schema_key: &str,
8
- operation: &str,
8
+ action: &str,
9
9
  ) -> Result<(), DataFusionError> {
10
10
  if schema_key == "lix_directory_descriptor" {
11
11
  return Err(read_only_error(
12
- operation,
12
+ action,
13
13
  schema_key,
14
14
  "Use the writable lix_directory surface to create, update, or delete directories.",
15
15
  ));
16
16
  }
17
17
  if let Some(message) = read_only_schema_message(schema_key) {
18
- return Err(read_only_error(operation, schema_key, message));
18
+ return Err(read_only_error(action, schema_key, message));
19
19
  }
20
20
  Ok(())
21
21
  }
22
22
 
23
23
  pub(crate) fn reject_read_only_stage_rows(
24
- rows: &[StageRow],
25
- operation: &str,
24
+ rows: &[TransactionWriteRow],
25
+ action: &str,
26
26
  ) -> Result<(), DataFusionError> {
27
27
  for row in rows {
28
28
  if let Some(message) = read_only_schema_message(&row.schema_key) {
29
- return Err(read_only_error(operation, &row.schema_key, message));
29
+ return Err(read_only_error(action, &row.schema_key, message));
30
30
  }
31
31
  }
32
32
  Ok(())
33
33
  }
34
34
 
35
- fn read_only_error(operation: &str, schema_key: &str, message: &'static str) -> DataFusionError {
35
+ fn read_only_error(action: &str, schema_key: &str, message: &'static str) -> DataFusionError {
36
36
  super::error::lix_error_to_datafusion_error(
37
37
  LixError::new(
38
38
  LixError::CODE_READ_ONLY,
39
- format!("{operation} cannot write read-only surface '{schema_key}'"),
39
+ format!("{action} cannot write read-only surface '{schema_key}'"),
40
40
  )
41
41
  .with_hint(message),
42
42
  )
@@ -55,9 +55,7 @@ fn read_only_schema_message(schema_key: &str) -> Option<&'static str> {
55
55
  }
56
56
  "lix_commit"
57
57
  | "lix_commit_edge"
58
- | "lix_change"
59
- | "lix_change_set"
60
- | "lix_change_set_element" => Some(
58
+ | "lix_change" => Some(
61
59
  "Commit graph and changelog surfaces are read-only; Lix creates them when transactions commit.",
62
60
  ),
63
61
  _ => None,
@@ -5,7 +5,6 @@ use datafusion::prelude::{SessionConfig, SessionContext};
5
5
  use crate::LixError;
6
6
 
7
7
  use super::change_provider::register_lix_change_provider;
8
- use super::commit_derived_provider::register_commit_derived_providers;
9
8
  use super::directory_history_provider::register_lix_directory_history_provider;
10
9
  use super::directory_provider::{
11
10
  register_lix_directory_providers, register_lix_directory_write_providers,
@@ -37,22 +36,20 @@ pub(crate) async fn build_read_session(
37
36
  )
38
37
  .await?;
39
38
  register_lix_version_provider(&session, ctx.live_state(), Arc::clone(&version_ref)).await?;
40
- let changelog_query_source = ctx.changelog_query_source();
41
- register_lix_change_provider(&session, changelog_query_source.clone()).await?;
42
- let commit_graph = ctx.commit_graph();
43
- register_commit_derived_providers(&session, commit_graph, Arc::clone(&version_ref)).await?;
39
+ let commit_store_query_source = ctx.commit_store_query_source();
40
+ register_lix_change_provider(&session, commit_store_query_source.clone()).await?;
44
41
  let state_history_commit_graph = ctx.commit_graph();
45
42
  register_history_providers(
46
43
  &session,
47
44
  state_history_commit_graph,
48
- changelog_query_source.clone(),
45
+ commit_store_query_source.clone(),
49
46
  )
50
47
  .await?;
51
48
  let file_history_commit_graph = ctx.commit_graph();
52
49
  register_lix_file_history_provider(
53
50
  &session,
54
51
  file_history_commit_graph,
55
- changelog_query_source.clone(),
52
+ commit_store_query_source.clone(),
56
53
  ctx.blob_reader(),
57
54
  )
58
55
  .await?;
@@ -60,7 +57,7 @@ pub(crate) async fn build_read_session(
60
57
  register_lix_directory_history_provider(
61
58
  &session,
62
59
  directory_history_commit_graph,
63
- changelog_query_source.clone(),
60
+ commit_store_query_source.clone(),
64
61
  )
65
62
  .await?;
66
63
  let entity_commit_graph = Arc::new(tokio::sync::Mutex::new(ctx.commit_graph()));
@@ -87,7 +84,7 @@ pub(crate) async fn build_read_session(
87
84
  ctx.live_state(),
88
85
  Arc::clone(&version_ref),
89
86
  entity_commit_graph,
90
- changelog_query_source,
87
+ commit_store_query_source,
91
88
  &ctx.list_visible_schemas()?,
92
89
  )
93
90
  .await?;
@@ -120,7 +117,7 @@ pub(crate) async fn build_write_session(
120
117
  Ok(session)
121
118
  }
122
119
 
123
- fn new_sql_session_context() -> SessionContext {
120
+ pub(crate) fn new_sql_session_context() -> SessionContext {
124
121
  SessionContext::new_with_config(
125
122
  SessionConfig::new()
126
123
  .with_information_schema(true)
@@ -0,0 +1,76 @@
1
+ use std::any::Any;
2
+
3
+ use datafusion::arrow::datatypes::DataType;
4
+ use datafusion::common::{plan_err, Result, ScalarValue};
5
+ use datafusion::logical_expr::{
6
+ ColumnarValue, ScalarFunctionArgs, ScalarUDFImpl, Signature, Volatility,
7
+ };
8
+
9
+ use crate::functions::FunctionProviderHandle;
10
+
11
/// Scalar UDF backing the SQL function `lix_timestamp()`.
#[derive(Clone)]
pub(super) struct LixTimestamp {
    /// Function provider whose `call_timestamp()` supplies the returned value.
    pub(super) functions: FunctionProviderHandle,
}
15
+
16
/// All `LixTimestamp` values compare equal; the `functions` handle is
/// deliberately not part of the comparison.
// NOTE(review): presumably the handle has no usable equality and the UDF is
// identified by name alone — confirm.
impl PartialEq for LixTimestamp {
    fn eq(&self, _other: &Self) -> bool {
        true
    }
}

impl Eq for LixTimestamp {}
23
+
24
+ impl std::hash::Hash for LixTimestamp {
25
+ fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
26
+ self.name().hash(state);
27
+ }
28
+ }
29
+
30
+ impl std::fmt::Debug for LixTimestamp {
31
+ fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
32
+ f.debug_struct("LixTimestamp").finish()
33
+ }
34
+ }
35
+
36
+ impl ScalarUDFImpl for LixTimestamp {
37
+ fn as_any(&self) -> &dyn Any {
38
+ self
39
+ }
40
+
41
+ fn name(&self) -> &str {
42
+ "lix_timestamp"
43
+ }
44
+
45
+ fn signature(&self) -> &Signature {
46
+ static SIGNATURE: std::sync::LazyLock<Signature> =
47
+ std::sync::LazyLock::new(|| Signature::nullary(Volatility::Volatile));
48
+ &SIGNATURE
49
+ }
50
+
51
+ fn return_type(&self, _arg_types: &[DataType]) -> Result<DataType> {
52
+ Ok(DataType::Utf8)
53
+ }
54
+
55
+ fn invoke_with_args(&self, args: ScalarFunctionArgs) -> Result<ColumnarValue> {
56
+ if !args.args.is_empty() {
57
+ return plan_err!("lix_timestamp requires no arguments");
58
+ }
59
+ Ok(ColumnarValue::Scalar(ScalarValue::Utf8(Some(
60
+ self.functions.call_timestamp(),
61
+ ))))
62
+ }
63
+ }
64
+
65
#[cfg(test)]
mod tests {
    use super::super::test_support::single_text;

    /// `lix_timestamp()` must yield a non-null, non-empty text value.
    #[tokio::test]
    async fn returns_timestamp_text() {
        let queried = single_text("SELECT lix_timestamp()").await;
        let timestamp = queried.expect("timestamp should not be null");
        assert!(!timestamp.is_empty());
    }
}
@@ -6,13 +6,17 @@ mod lix_json_get;
6
6
  mod lix_json_get_text;
7
7
  mod lix_text_decode;
8
8
  mod lix_text_encode;
9
+ mod lix_timestamp;
9
10
  mod lix_uuid_v7;
11
+ mod public_call;
10
12
 
11
13
  use datafusion::execution::context::SessionContext;
12
14
  use datafusion::logical_expr::ScalarUDF;
13
15
 
14
16
  use crate::functions::FunctionProviderHandle;
15
17
 
18
+ pub(crate) use public_call::validate_public_udf_calls_in_datafusion_statement;
19
+
16
20
  #[cfg(test)]
17
21
  pub(crate) fn system_sql2_function_provider() -> FunctionProviderHandle {
18
22
  use crate::functions::{FunctionProvider, SharedFunctionProvider, SystemFunctionProvider};
@@ -34,7 +38,10 @@ pub(crate) fn register_sql2_functions(
34
38
  ctx.register_udf(ScalarUDF::from(lix_text_encode::LixTextEncode::new()));
35
39
  ctx.register_udf(ScalarUDF::from(lix_json::LixJson));
36
40
  ctx.register_udf(ScalarUDF::from(lix_empty_blob::LixEmptyBlob));
37
- ctx.register_udf(ScalarUDF::from(lix_uuid_v7::LixUuidV7 { functions }));
41
+ ctx.register_udf(ScalarUDF::from(lix_uuid_v7::LixUuidV7 {
42
+ functions: functions.clone(),
43
+ }));
44
+ ctx.register_udf(ScalarUDF::from(lix_timestamp::LixTimestamp { functions }));
38
45
  }
39
46
 
40
47
  #[cfg(test)]
@@ -0,0 +1,238 @@
1
+ use std::ops::ControlFlow;
2
+
3
+ use datafusion::sql::parser::Statement as DataFusionStatement;
4
+ use datafusion::sql::sqlparser::ast::{
5
+ Expr, Function, FunctionArg, FunctionArgExpr, FunctionArguments, ObjectNamePart, Statement,
6
+ Value, Visit, Visitor,
7
+ };
8
+ #[cfg(test)]
9
+ use datafusion::sql::sqlparser::dialect::GenericDialect;
10
+ #[cfg(test)]
11
+ use datafusion::sql::sqlparser::parser::Parser;
12
+
13
+ use crate::LixError;
14
+
15
/// Test-only entry point: parses `sql` with the generic dialect and validates
/// every public `lix_*` function call found in it.
///
/// # Errors
///
/// Returns `CODE_PARSE_ERROR` when the SQL does not parse, otherwise the first
/// validation error raised by the visitor.
#[cfg(test)]
pub(crate) fn validate_public_udf_calls(sql: &str) -> Result<(), LixError> {
    let statements = match Parser::parse_sql(&GenericDialect {}, sql) {
        Ok(statements) => statements,
        Err(error) => {
            return Err(LixError::new(
                LixError::CODE_PARSE_ERROR,
                format!("sql2 SQL parse error: {error}"),
            ));
        }
    };

    if let ControlFlow::Break(error) = statements.visit(&mut PublicUdfCallVisitor) {
        return Err(*error);
    }
    Ok(())
}
30
+
31
+ struct PublicUdfCallVisitor;
32
+
33
+ impl Visitor for PublicUdfCallVisitor {
34
+ type Break = Box<LixError>;
35
+
36
+ fn pre_visit_expr(&mut self, expr: &Expr) -> ControlFlow<Self::Break> {
37
+ let Expr::Function(function) = expr else {
38
+ return ControlFlow::Continue(());
39
+ };
40
+
41
+ match validate_public_function_call(function) {
42
+ Ok(()) => ControlFlow::Continue(()),
43
+ Err(error) => ControlFlow::Break(Box::new(error)),
44
+ }
45
+ }
46
+
47
+ fn pre_visit_statement(&mut self, statement: &Statement) -> ControlFlow<Self::Break> {
48
+ match statement {
49
+ Statement::CreateFunction(_) | Statement::DropFunction(_) => ControlFlow::Continue(()),
50
+ _ => ControlFlow::Continue(()),
51
+ }
52
+ }
53
+ }
54
+
55
+ fn validate_public_function_call(function: &Function) -> Result<(), LixError> {
56
+ let Some(name) = public_lix_function_name(function) else {
57
+ return Ok(());
58
+ };
59
+ let arity = function_arity(&function.args);
60
+
61
+ match name {
62
+ "lix_json" => expect_exact_arity(name, arity, 1),
63
+ "lix_empty_blob" => expect_exact_arity(name, arity, 0),
64
+ "lix_timestamp" => expect_exact_arity(name, arity, 0),
65
+ "lix_uuid_v7" => expect_exact_arity(name, arity, 0),
66
+ "lix_active_version_commit_id" => expect_exact_arity(name, arity, 0),
67
+ "lix_text_encode" | "lix_text_decode" => {
68
+ expect_arity_range(name, arity, 1, 2)?;
69
+ validate_literal_utf8_encoding(name, &function.args)
70
+ }
71
+ _ => Ok(()),
72
+ }
73
+ }
74
+
75
+ pub(crate) fn validate_public_udf_calls_in_datafusion_statement(
76
+ statement: &DataFusionStatement,
77
+ ) -> Result<(), LixError> {
78
+ let mut visitor = PublicUdfCallVisitor;
79
+ visit_datafusion_statement(statement, &mut visitor)
80
+ }
81
+
82
+ fn visit_datafusion_statement(
83
+ statement: &DataFusionStatement,
84
+ visitor: &mut PublicUdfCallVisitor,
85
+ ) -> Result<(), LixError> {
86
+ match statement {
87
+ DataFusionStatement::Statement(statement) => match statement.visit(visitor) {
88
+ ControlFlow::Continue(()) => Ok(()),
89
+ ControlFlow::Break(error) => Err(*error),
90
+ },
91
+ DataFusionStatement::Explain(explain) => {
92
+ visit_datafusion_statement(explain.statement.as_ref(), visitor)
93
+ }
94
+ _ => Ok(()),
95
+ }
96
+ }
97
+
98
+ fn public_lix_function_name(function: &Function) -> Option<&'static str> {
99
+ let part = function.name.0.last()?;
100
+ let ident = match part {
101
+ ObjectNamePart::Identifier(ident) => ident.value.as_str(),
102
+ ObjectNamePart::Function(_) => return None,
103
+ };
104
+ match ident.to_ascii_lowercase().as_str() {
105
+ "lix_json" => Some("lix_json"),
106
+ "lix_empty_blob" => Some("lix_empty_blob"),
107
+ "lix_timestamp" => Some("lix_timestamp"),
108
+ "lix_uuid_v7" => Some("lix_uuid_v7"),
109
+ "lix_active_version_commit_id" => Some("lix_active_version_commit_id"),
110
+ "lix_text_encode" => Some("lix_text_encode"),
111
+ "lix_text_decode" => Some("lix_text_decode"),
112
+ _ => None,
113
+ }
114
+ }
115
+
116
+ fn function_arity(args: &FunctionArguments) -> usize {
117
+ match args {
118
+ FunctionArguments::None => 0,
119
+ FunctionArguments::Subquery(_) => 1,
120
+ FunctionArguments::List(list) => list.args.len(),
121
+ }
122
+ }
123
+
124
+ fn expect_exact_arity(name: &str, actual: usize, expected: usize) -> Result<(), LixError> {
125
+ if actual == expected {
126
+ return Ok(());
127
+ }
128
+
129
+ let expectation = if expected == 0 {
130
+ "no arguments".to_string()
131
+ } else if expected == 1 {
132
+ "exactly 1 argument".to_string()
133
+ } else {
134
+ format!("exactly {expected} arguments")
135
+ };
136
+ Err(invalid_param(format!("{name} requires {expectation}")))
137
+ }
138
+
139
+ fn expect_arity_range(name: &str, actual: usize, min: usize, max: usize) -> Result<(), LixError> {
140
+ if (min..=max).contains(&actual) {
141
+ return Ok(());
142
+ }
143
+ Err(invalid_param(format!(
144
+ "{name} requires {min} or {max} arguments"
145
+ )))
146
+ }
147
+
148
+ fn validate_literal_utf8_encoding(name: &str, args: &FunctionArguments) -> Result<(), LixError> {
149
+ let Some(encoding) = function_arg(args, 1) else {
150
+ return Ok(());
151
+ };
152
+ let Some(value) = string_literal_arg(encoding) else {
153
+ return Ok(());
154
+ };
155
+ let normalized = value.trim().to_ascii_uppercase().replace('-', "");
156
+ if normalized == "UTF8" {
157
+ Ok(())
158
+ } else {
159
+ Err(invalid_param(format!(
160
+ "{name}() only supports UTF8 encoding, got '{value}'"
161
+ )))
162
+ }
163
+ }
164
+
165
+ fn function_arg(args: &FunctionArguments, index: usize) -> Option<&FunctionArg> {
166
+ match args {
167
+ FunctionArguments::List(list) => list.args.get(index),
168
+ _ => None,
169
+ }
170
+ }
171
+
172
/// Extracts the text of a function argument when that argument is a string
/// literal.
///
/// Positional and both named argument forms are accepted. Returns `None` when
/// the argument is not a plain expression, the expression is not a literal
/// value, or the literal is not one of the string-like variants listed below.
fn string_literal_arg(arg: &FunctionArg) -> Option<&str> {
    // Unwrap the expression regardless of how the argument was passed.
    let expr = match arg {
        FunctionArg::Unnamed(FunctionArgExpr::Expr(expr))
        | FunctionArg::Named {
            arg: FunctionArgExpr::Expr(expr),
            ..
        }
        | FunctionArg::ExprNamed {
            arg: FunctionArgExpr::Expr(expr),
            ..
        } => expr,
        _ => return None,
    };
    let Expr::Value(value) = expr else {
        return None;
    };
    // Every quoting style that carries its text as a plain `String`.
    match &value.value {
        Value::SingleQuotedString(value)
        | Value::DoubleQuotedString(value)
        | Value::TripleSingleQuotedString(value)
        | Value::TripleDoubleQuotedString(value)
        | Value::EscapedStringLiteral(value)
        | Value::UnicodeStringLiteral(value)
        | Value::NationalStringLiteral(value)
        | Value::SingleQuotedRawStringLiteral(value)
        | Value::DoubleQuotedRawStringLiteral(value)
        | Value::TripleSingleQuotedRawStringLiteral(value)
        | Value::TripleDoubleQuotedRawStringLiteral(value) => Some(value.as_str()),
        // Dollar-quoted strings wrap their text in a struct.
        Value::DollarQuotedString(value) => Some(value.value.as_str()),
        _ => None,
    }
}
204
+
205
/// Builds a `LixError` with code `CODE_INVALID_PARAM` and the given message.
fn invalid_param(message: impl Into<String>) -> LixError {
    LixError::new(LixError::CODE_INVALID_PARAM, message)
}
208
+
209
#[cfg(test)]
mod tests {
    use super::validate_public_udf_calls;

    /// Passing an argument to a nullary function yields `LIX_INVALID_PARAM`.
    #[test]
    fn rejects_lix_udf_wrong_arity_as_public_invalid_param() {
        let outcome = validate_public_udf_calls("SELECT lix_uuid_v7('extra')");
        let error = outcome.expect_err("wrong arity should be rejected");

        assert_eq!(error.code, "LIX_INVALID_PARAM");
        assert!(error.message.contains("lix_uuid_v7 requires no arguments"));
    }

    /// A literal encoding other than UTF-8 yields `LIX_INVALID_PARAM`.
    #[test]
    fn rejects_unsupported_literal_encoding_as_public_invalid_param() {
        let outcome = validate_public_udf_calls("SELECT lix_text_encode('Ada', 'base64')");
        let error = outcome.expect_err("unsupported encoding should be rejected");

        assert_eq!(error.code, "LIX_INVALID_PARAM");
        let mentions_encoding = error
            .message
            .contains("lix_text_encode() only supports UTF8 encoding");
        assert!(mentions_encoding);
    }

    /// Correct arities and a hyphenated, lowercase `utf-8` literal are accepted.
    #[test]
    fn accepts_valid_public_lix_udf_calls() {
        let outcome = validate_public_udf_calls(
            "SELECT lix_json('{\"x\":1}'), lix_text_decode(X'416461', 'utf-8')",
        );
        outcome.expect("valid calls should pass public validation");
    }
}