@lix-js/sdk 0.6.0-preview.4 → 0.6.0-preview.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (234) hide show
  1. package/README.md +1 -1
  2. package/SKILL.md +65 -64
  3. package/dist/engine-wasm/index.js +4 -4
  4. package/dist/engine-wasm/wasm/lix_engine.d.ts +5 -5
  5. package/dist/engine-wasm/wasm/lix_engine.js +130 -118
  6. package/dist/engine-wasm/wasm/lix_engine.wasm +0 -0
  7. package/dist/engine-wasm/wasm/lix_engine.wasm.d.ts +9 -8
  8. package/dist/generated/builtin-schemas.d.ts +69 -69
  9. package/dist/generated/builtin-schemas.js +94 -94
  10. package/dist/open-lix.d.ts +33 -26
  11. package/dist/open-lix.js +10 -10
  12. package/dist/sqlite/index.js +86 -30
  13. package/dist-engine-src/README.md +3 -3
  14. package/dist-engine-src/src/backend/capabilities.rs +67 -0
  15. package/dist-engine-src/src/backend/conformance/baseline.rs +1127 -0
  16. package/dist-engine-src/src/backend/conformance/factory.rs +93 -0
  17. package/dist-engine-src/src/backend/conformance/failure_tests.rs +608 -0
  18. package/dist-engine-src/src/backend/conformance/fixtures.rs +26 -0
  19. package/dist-engine-src/src/backend/conformance/mod.rs +75 -0
  20. package/dist-engine-src/src/backend/conformance/model.rs +28 -0
  21. package/dist-engine-src/src/backend/conformance/model_based.rs +257 -0
  22. package/dist-engine-src/src/backend/conformance/persistence.rs +204 -0
  23. package/dist-engine-src/src/backend/conformance/projection.rs +21 -0
  24. package/dist-engine-src/src/backend/conformance/pushdown.rs +24 -0
  25. package/dist-engine-src/src/backend/conformance/runner.rs +90 -0
  26. package/dist-engine-src/src/backend/conformance/scan.rs +24 -0
  27. package/dist-engine-src/src/backend/conformance/write.rs +16 -0
  28. package/dist-engine-src/src/backend/error.rs +94 -0
  29. package/dist-engine-src/src/backend/in_memory.rs +670 -0
  30. package/dist-engine-src/src/backend/mod.rs +36 -9
  31. package/dist-engine-src/src/backend/predicate.rs +80 -0
  32. package/dist-engine-src/src/backend/traits.rs +260 -0
  33. package/dist-engine-src/src/backend/types.rs +224 -81
  34. package/dist-engine-src/src/binary_cas/context.rs +8 -8
  35. package/dist-engine-src/src/binary_cas/kv.rs +234 -259
  36. package/dist-engine-src/src/{version → branch}/context.rs +12 -12
  37. package/dist-engine-src/src/branch/lifecycle.rs +221 -0
  38. package/dist-engine-src/src/branch/mod.rs +13 -0
  39. package/dist-engine-src/src/branch/refs.rs +321 -0
  40. package/dist-engine-src/src/branch/stage_rows.rs +67 -0
  41. package/dist-engine-src/src/branch/types.rs +21 -0
  42. package/dist-engine-src/src/catalog/context.rs +18 -18
  43. package/dist-engine-src/src/catalog/snapshot.rs +8 -8
  44. package/dist-engine-src/src/changelog/bench_support.rs +785 -0
  45. package/dist-engine-src/src/changelog/change.rs +1 -0
  46. package/dist-engine-src/src/changelog/codec.rs +497 -0
  47. package/dist-engine-src/src/changelog/commit.rs +1 -0
  48. package/dist-engine-src/src/changelog/context.rs +1614 -0
  49. package/dist-engine-src/src/changelog/mod.rs +29 -0
  50. package/dist-engine-src/src/changelog/store.rs +163 -0
  51. package/dist-engine-src/src/changelog/test_support.rs +54 -0
  52. package/dist-engine-src/src/changelog/types.rs +213 -0
  53. package/dist-engine-src/src/commit_graph/context.rs +317 -274
  54. package/dist-engine-src/src/commit_graph/mod.rs +2 -4
  55. package/dist-engine-src/src/commit_graph/types.rs +22 -42
  56. package/dist-engine-src/src/commit_graph/walker.rs +133 -103
  57. package/dist-engine-src/src/common/error.rs +52 -18
  58. package/dist-engine-src/src/common/identity.rs +2 -2
  59. package/dist-engine-src/src/common/mod.rs +1 -1
  60. package/dist-engine-src/src/domain.rs +42 -46
  61. package/dist-engine-src/src/engine.rs +74 -96
  62. package/dist-engine-src/src/{entity_identity.rs → entity_pk.rs} +89 -92
  63. package/dist-engine-src/src/functions/context.rs +56 -52
  64. package/dist-engine-src/src/functions/state.rs +51 -52
  65. package/dist-engine-src/src/init.rs +288 -154
  66. package/dist-engine-src/src/json_store/context.rs +15 -266
  67. package/dist-engine-src/src/json_store/mod.rs +26 -0
  68. package/dist-engine-src/src/json_store/store.rs +103 -718
  69. package/dist-engine-src/src/json_store/types.rs +4 -9
  70. package/dist-engine-src/src/lib.rs +49 -19
  71. package/dist-engine-src/src/live_state/context.rs +654 -790
  72. package/dist-engine-src/src/live_state/mod.rs +9 -3
  73. package/dist-engine-src/src/live_state/overlay.rs +4 -4
  74. package/dist-engine-src/src/live_state/types.rs +30 -21
  75. package/dist-engine-src/src/live_state/visibility.rs +514 -71
  76. package/dist-engine-src/src/plugin/install.rs +48 -48
  77. package/dist-engine-src/src/plugin/manifest.rs +7 -7
  78. package/dist-engine-src/src/plugin/materializer.rs +0 -275
  79. package/dist-engine-src/src/plugin/plugin_manifest.json +4 -3
  80. package/dist-engine-src/src/schema/builtin/lix_binary_blob_ref.json +2 -2
  81. package/dist-engine-src/src/schema/builtin/lix_branch_descriptor.json +34 -0
  82. package/dist-engine-src/src/schema/builtin/lix_branch_ref.json +48 -0
  83. package/dist-engine-src/src/schema/builtin/lix_change.json +3 -3
  84. package/dist-engine-src/src/schema/builtin/lix_commit.json +1 -1
  85. package/dist-engine-src/src/schema/builtin/lix_label_assignment.json +6 -6
  86. package/dist-engine-src/src/schema/builtin/mod.rs +18 -20
  87. package/dist-engine-src/src/schema/compatibility.rs +11 -11
  88. package/dist-engine-src/src/schema/definition.json +2 -2
  89. package/dist-engine-src/src/schema/definition.rs +5 -5
  90. package/dist-engine-src/src/schema/key.rs +3 -3
  91. package/dist-engine-src/src/schema/mod.rs +1 -1
  92. package/dist-engine-src/src/schema/tests.rs +18 -18
  93. package/dist-engine-src/src/session/context.rs +803 -148
  94. package/dist-engine-src/src/session/create_branch.rs +94 -0
  95. package/dist-engine-src/src/session/execute.rs +223 -83
  96. package/dist-engine-src/src/session/merge/analysis.rs +9 -3
  97. package/dist-engine-src/src/session/merge/{version.rs → branch.rs} +119 -129
  98. package/dist-engine-src/src/session/merge/conflicts.rs +2 -2
  99. package/dist-engine-src/src/session/merge/mod.rs +5 -6
  100. package/dist-engine-src/src/session/merge/stats.rs +7 -11
  101. package/dist-engine-src/src/session/mod.rs +15 -12
  102. package/dist-engine-src/src/session/switch_branch.rs +113 -0
  103. package/dist-engine-src/src/session/transaction.rs +495 -14
  104. package/dist-engine-src/src/sql2/{classify.rs → bind/classify.rs} +3 -75
  105. package/dist-engine-src/src/sql2/bind/error.rs +5 -0
  106. package/dist-engine-src/src/sql2/bind/expr.rs +29 -0
  107. package/dist-engine-src/src/sql2/bind/mod.rs +12 -0
  108. package/dist-engine-src/src/sql2/{udfs/public_call.rs → bind/public_udf.rs} +71 -3
  109. package/dist-engine-src/src/sql2/bind/read.rs +65 -0
  110. package/dist-engine-src/src/sql2/bind/statement.rs +2236 -0
  111. package/dist-engine-src/src/sql2/bind/table.rs +273 -0
  112. package/dist-engine-src/src/sql2/bind/write.rs +86 -0
  113. package/dist-engine-src/src/sql2/branch_scope.rs +436 -0
  114. package/dist-engine-src/src/sql2/catalog/capability.rs +20 -0
  115. package/dist-engine-src/src/sql2/catalog/entity_surface.rs +296 -0
  116. package/dist-engine-src/src/sql2/catalog/mod.rs +15 -0
  117. package/dist-engine-src/src/sql2/catalog/registry.rs +556 -0
  118. package/dist-engine-src/src/sql2/catalog/schema.rs +88 -0
  119. package/dist-engine-src/src/sql2/catalog/surface.rs +41 -0
  120. package/dist-engine-src/src/sql2/change_materialization.rs +122 -0
  121. package/dist-engine-src/src/sql2/context.rs +36 -30
  122. package/dist-engine-src/src/sql2/error.rs +1 -1
  123. package/dist-engine-src/src/sql2/exec/bound_public_write.rs +1593 -0
  124. package/dist-engine-src/src/sql2/exec/datafusion.rs +5266 -0
  125. package/dist-engine-src/src/sql2/exec/fast_write.rs +82 -0
  126. package/dist-engine-src/src/sql2/exec/mod.rs +24 -0
  127. package/dist-engine-src/src/sql2/exec/write.rs +661 -0
  128. package/dist-engine-src/src/sql2/filesystem_planner.rs +72 -77
  129. package/dist-engine-src/src/sql2/filesystem_visibility.rs +21 -21
  130. package/dist-engine-src/src/sql2/history_projection.rs +8 -8
  131. package/dist-engine-src/src/sql2/history_route.rs +35 -31
  132. package/dist-engine-src/src/sql2/mod.rs +28 -23
  133. package/dist-engine-src/src/sql2/optimize/datafusion.rs +1 -0
  134. package/dist-engine-src/src/sql2/optimize/mod.rs +2 -0
  135. package/dist-engine-src/src/sql2/optimize/simple_write.rs +116 -0
  136. package/dist-engine-src/src/sql2/parse/mod.rs +69 -0
  137. package/dist-engine-src/src/sql2/parse/normalize.rs +1 -0
  138. package/dist-engine-src/src/sql2/plan/branch_scope.rs +24 -0
  139. package/dist-engine-src/src/sql2/plan/mod.rs +5 -0
  140. package/dist-engine-src/src/sql2/plan/predicate.rs +22 -0
  141. package/dist-engine-src/src/sql2/plan/write.rs +147 -0
  142. package/dist-engine-src/src/sql2/predicate_typecheck.rs +258 -0
  143. package/dist-engine-src/src/sql2/{version_provider.rs → providers/branch.rs} +218 -214
  144. package/dist-engine-src/src/sql2/{change_provider.rs → providers/change.rs} +156 -42
  145. package/dist-engine-src/src/sql2/{directory_provider.rs → providers/directory.rs} +291 -322
  146. package/dist-engine-src/src/sql2/{directory_history_provider.rs → providers/directory_history.rs} +56 -42
  147. package/dist-engine-src/src/sql2/providers/entity.rs +1484 -0
  148. package/dist-engine-src/src/sql2/{entity_history_provider.rs → providers/entity_history.rs} +43 -31
  149. package/dist-engine-src/src/sql2/{file_provider.rs → providers/file.rs} +323 -316
  150. package/dist-engine-src/src/sql2/{file_history_provider.rs → providers/file_history.rs} +60 -46
  151. package/dist-engine-src/src/sql2/{history_provider.rs → providers/history.rs} +46 -32
  152. package/dist-engine-src/src/sql2/{lix_state_provider.rs → providers/lix_state.rs} +359 -329
  153. package/dist-engine-src/src/sql2/providers/mod.rs +508 -0
  154. package/dist-engine-src/src/sql2/read_only.rs +2 -2
  155. package/dist-engine-src/src/sql2/session.rs +47 -96
  156. package/dist-engine-src/src/sql2/storage/constraints.rs +1 -0
  157. package/dist-engine-src/src/sql2/storage/mod.rs +1 -0
  158. package/dist-engine-src/src/sql2/test_support/differential.rs +712 -0
  159. package/dist-engine-src/src/sql2/test_support/generators.rs +354 -0
  160. package/dist-engine-src/src/sql2/test_support/mod.rs +2 -0
  161. package/dist-engine-src/src/sql2/udfs/{lix_active_version_commit_id.rs → lix_active_branch_commit_id.rs} +7 -7
  162. package/dist-engine-src/src/sql2/udfs/mod.rs +3 -6
  163. package/dist-engine-src/src/sql2/write_normalization.rs +45 -22
  164. package/dist-engine-src/src/storage/conformance.rs +399 -0
  165. package/dist-engine-src/src/storage/context.rs +552 -288
  166. package/dist-engine-src/src/storage/mod.rs +48 -10
  167. package/dist-engine-src/src/storage/point.rs +440 -0
  168. package/dist-engine-src/src/storage/read_scope.rs +43 -64
  169. package/dist-engine-src/src/storage/reader.rs +867 -0
  170. package/dist-engine-src/src/storage/scan.rs +784 -0
  171. package/dist-engine-src/src/storage/spaces.rs +236 -0
  172. package/dist-engine-src/src/storage/stats.rs +80 -0
  173. package/dist-engine-src/src/storage/write_set.rs +962 -0
  174. package/dist-engine-src/src/storage_bench.rs +136 -4828
  175. package/dist-engine-src/src/test_support.rs +360 -138
  176. package/dist-engine-src/src/tracked_state/bench_support.rs +394 -0
  177. package/dist-engine-src/src/tracked_state/codec.rs +155 -1057
  178. package/dist-engine-src/src/tracked_state/commit_root_rebuild.rs +358 -0
  179. package/dist-engine-src/src/tracked_state/context.rs +1927 -993
  180. package/dist-engine-src/src/tracked_state/diff.rs +1715 -261
  181. package/dist-engine-src/src/tracked_state/merge.rs +74 -88
  182. package/dist-engine-src/src/tracked_state/mod.rs +19 -16
  183. package/dist-engine-src/src/tracked_state/{materialization.rs → row_materialization.rs} +50 -178
  184. package/dist-engine-src/src/tracked_state/storage.rs +243 -191
  185. package/dist-engine-src/src/tracked_state/tree.rs +247 -371
  186. package/dist-engine-src/src/tracked_state/types.rs +49 -42
  187. package/dist-engine-src/src/transaction/bench_support.rs +407 -0
  188. package/dist-engine-src/src/transaction/commit.rs +821 -713
  189. package/dist-engine-src/src/transaction/context.rs +705 -600
  190. package/dist-engine-src/src/transaction/mod.rs +13 -2
  191. package/dist-engine-src/src/transaction/normalization.rs +63 -76
  192. package/dist-engine-src/src/transaction/prep.rs +13 -13
  193. package/dist-engine-src/src/transaction/schema_resolver.rs +19 -5
  194. package/dist-engine-src/src/transaction/staging.rs +228 -434
  195. package/dist-engine-src/src/transaction/types.rs +41 -98
  196. package/dist-engine-src/src/transaction/validation.rs +382 -446
  197. package/dist-engine-src/src/untracked_state/codec.rs +337 -29
  198. package/dist-engine-src/src/untracked_state/context.rs +7 -7
  199. package/dist-engine-src/src/untracked_state/materialization.rs +2 -2
  200. package/dist-engine-src/src/untracked_state/mod.rs +1 -1
  201. package/dist-engine-src/src/untracked_state/storage.rs +659 -157
  202. package/dist-engine-src/src/untracked_state/types.rs +21 -21
  203. package/package.json +71 -68
  204. package/dist-engine-src/src/backend/kv.rs +0 -358
  205. package/dist-engine-src/src/backend/testing.rs +0 -658
  206. package/dist-engine-src/src/commit_store/codec.rs +0 -887
  207. package/dist-engine-src/src/commit_store/context.rs +0 -944
  208. package/dist-engine-src/src/commit_store/materialization.rs +0 -84
  209. package/dist-engine-src/src/commit_store/mod.rs +0 -16
  210. package/dist-engine-src/src/commit_store/storage.rs +0 -600
  211. package/dist-engine-src/src/commit_store/types.rs +0 -215
  212. package/dist-engine-src/src/schema/builtin/lix_version_descriptor.json +0 -34
  213. package/dist-engine-src/src/schema/builtin/lix_version_ref.json +0 -48
  214. package/dist-engine-src/src/session/create_version.rs +0 -88
  215. package/dist-engine-src/src/session/merge/apply.rs +0 -23
  216. package/dist-engine-src/src/session/optimization9_sql2_bench.rs +0 -100
  217. package/dist-engine-src/src/session/switch_version.rs +0 -110
  218. package/dist-engine-src/src/sql2/entity_provider.rs +0 -3211
  219. package/dist-engine-src/src/sql2/execute.rs +0 -3533
  220. package/dist-engine-src/src/sql2/public_bind/assignment.rs +0 -46
  221. package/dist-engine-src/src/sql2/public_bind/capability.rs +0 -41
  222. package/dist-engine-src/src/sql2/public_bind/dml.rs +0 -172
  223. package/dist-engine-src/src/sql2/public_bind/mod.rs +0 -26
  224. package/dist-engine-src/src/sql2/public_bind/table.rs +0 -168
  225. package/dist-engine-src/src/sql2/version_scope.rs +0 -394
  226. package/dist-engine-src/src/storage/types.rs +0 -501
  227. package/dist-engine-src/src/tracked_state/by_file_index.rs +0 -98
  228. package/dist-engine-src/src/tracked_state/materializer.rs +0 -488
  229. package/dist-engine-src/src/transaction/live_state_overlay.rs +0 -35
  230. package/dist-engine-src/src/version/lifecycle.rs +0 -221
  231. package/dist-engine-src/src/version/mod.rs +0 -13
  232. package/dist-engine-src/src/version/refs.rs +0 -330
  233. package/dist-engine-src/src/version/stage_rows.rs +0 -67
  234. package/dist-engine-src/src/version/types.rs +0 -21
@@ -0,0 +1,296 @@
1
+ use std::collections::BTreeSet;
2
+ use std::sync::Arc;
3
+
4
+ use datafusion::arrow::datatypes::{DataType, Field, Schema, SchemaRef};
5
+ use serde_json::Value as JsonValue;
6
+
7
+ use crate::sql2::history_route::{
8
+ HISTORY_COL_CHANGE_ID, HISTORY_COL_COMMIT_CREATED_AT, HISTORY_COL_DEPTH, HISTORY_COL_ENTITY_PK,
9
+ HISTORY_COL_FILE_ID, HISTORY_COL_METADATA, HISTORY_COL_OBSERVED_COMMIT_ID,
10
+ HISTORY_COL_SCHEMA_KEY, HISTORY_COL_SNAPSHOT_CONTENT, HISTORY_COL_START_COMMIT_ID,
11
+ };
12
+ use crate::sql2::result_metadata::{json_field, mark_json_field};
13
+ use crate::LixError;
14
+
15
/// Selects which set of system columns an entity surface carries.
///
/// `History` surfaces get the `HISTORY_COL_*` columns. `Active` and `ByBranch`
/// surfaces get the `lixcol_*` columns, and `ByBranch` additionally gets
/// `lixcol_branch_id` (see `entity_system_fields`).
#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub(crate) enum EntitySurfaceShape {
    Active,
    ByBranch,
    History,
}
21
+
22
/// SQL-facing type assigned to a schema property when it is exposed as a column.
///
/// The Arrow mapping lives in `arrow_data_type_for_entity_column_type`:
/// `String` and `Json` are both carried as `Utf8`, `Integer` as `Int64`,
/// `Number` as `Float64` and `Boolean` as `Boolean`.
#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub(crate) enum EntityColumnType {
    String,
    /// Objects, arrays and unions of more than one non-null JSON Schema type.
    Json,
    Integer,
    Number,
    Boolean,
}
30
+
31
+ #[derive(Debug, Clone, PartialEq, Eq)]
32
+ pub(crate) struct EntitySurfaceColumn {
33
+ pub(crate) name: String,
34
+ pub(crate) column_type: EntityColumnType,
35
+ }
36
+
37
+ #[derive(Debug, Clone, PartialEq, Eq)]
38
+ pub(crate) struct EntitySurfaceSpec {
39
+ pub(crate) schema_key: String,
40
+ pub(crate) primary_key_paths: Vec<Vec<String>>,
41
+ pub(crate) columns: Vec<EntitySurfaceColumn>,
42
+ }
43
+
44
+ impl EntitySurfaceSpec {
45
+ #[cfg(test)]
46
+ pub(crate) fn visible_column_names(&self) -> impl Iterator<Item = &str> {
47
+ self.columns.iter().map(|column| column.name.as_str())
48
+ }
49
+
50
+ pub(crate) fn visible_column(&self, column_name: &str) -> Option<&EntitySurfaceColumn> {
51
+ self.columns
52
+ .iter()
53
+ .find(|column| column.name == column_name)
54
+ }
55
+ }
56
+
57
+ pub(crate) fn derive_entity_surface_spec_from_schema(
58
+ schema: &JsonValue,
59
+ ) -> Result<EntitySurfaceSpec, LixError> {
60
+ let schema_key = schema
61
+ .get("x-lix-key")
62
+ .and_then(JsonValue::as_str)
63
+ .ok_or_else(|| {
64
+ LixError::new(
65
+ "LIX_ERROR_UNKNOWN",
66
+ "schema is missing string x-lix-key".to_string(),
67
+ )
68
+ })?;
69
+
70
+ let properties = schema
71
+ .get("properties")
72
+ .and_then(JsonValue::as_object)
73
+ .ok_or_else(|| {
74
+ LixError::new(
75
+ LixError::CODE_SCHEMA_DEFINITION,
76
+ format!("schema '{schema_key}' must define object properties"),
77
+ )
78
+ })?;
79
+
80
+ let mut columns = properties
81
+ .iter()
82
+ .filter(|(key, _)| !key.starts_with("lixcol_"))
83
+ .map(|(key, property_schema)| {
84
+ let column_type = entity_column_type_from_schema(property_schema).ok_or_else(|| {
85
+ LixError::new(
86
+ LixError::CODE_SCHEMA_DEFINITION,
87
+ format!(
88
+ "schema '{schema_key}' property '/{key}' must declare a SQL-projectable JSON Schema type"
89
+ ),
90
+ )
91
+ .with_hint("Use an explicit type such as string, number, integer, boolean, object, array, or a supported union of those types.")
92
+ })?;
93
+ Ok(EntitySurfaceColumn {
94
+ name: key.clone(),
95
+ column_type,
96
+ })
97
+ })
98
+ .collect::<Result<Vec<_>, LixError>>()?;
99
+ columns.sort_by(|left, right| left.name.cmp(&right.name));
100
+
101
+ let primary_key_paths = parse_primary_key_paths(schema)?;
102
+
103
+ Ok(EntitySurfaceSpec {
104
+ schema_key: schema_key.to_string(),
105
+ primary_key_paths,
106
+ columns,
107
+ })
108
+ }
109
+
110
/// Reports whether a schema gets an entity surface.
///
/// Every schema key is exposed except `lix_active_account` and `lix_change`.
/// The comparison is exact and case-sensitive.
pub(crate) fn schema_exposed_as_entity_surface(schema_key: &str) -> bool {
    const HIDDEN_SCHEMA_KEYS: [&str; 2] = ["lix_active_account", "lix_change"];
    !HIDDEN_SCHEMA_KEYS
        .iter()
        .any(|hidden| *hidden == schema_key)
}
113
+
114
/// Reports whether a schema gets an entity *history* surface.
///
/// Every schema key is exposed except `lix_commit` and `lix_commit_edge`.
/// The comparison is exact and case-sensitive.
pub(crate) fn schema_exposed_as_entity_history_surface(schema_key: &str) -> bool {
    const HIDDEN_SCHEMA_KEYS: [&str; 2] = ["lix_commit", "lix_commit_edge"];
    !HIDDEN_SCHEMA_KEYS
        .iter()
        .any(|hidden| *hidden == schema_key)
}
117
+
118
+ pub(crate) fn entity_surface_schema(
119
+ spec: &EntitySurfaceSpec,
120
+ shape: EntitySurfaceShape,
121
+ ) -> SchemaRef {
122
+ let mut fields = spec
123
+ .columns
124
+ .iter()
125
+ .map(|column| {
126
+ let field = Field::new(
127
+ &column.name,
128
+ arrow_data_type_for_entity_column_type(column.column_type),
129
+ true,
130
+ );
131
+ if column.column_type == EntityColumnType::Json {
132
+ mark_json_field(field)
133
+ } else {
134
+ field
135
+ }
136
+ })
137
+ .collect::<Vec<_>>();
138
+
139
+ fields.extend(entity_system_fields(shape));
140
+ Arc::new(Schema::new(fields))
141
+ }
142
+
143
+ pub(crate) fn entity_system_fields(shape: EntitySurfaceShape) -> Vec<Field> {
144
+ if shape == EntitySurfaceShape::History {
145
+ return vec![
146
+ json_field(HISTORY_COL_ENTITY_PK, false),
147
+ Field::new(HISTORY_COL_SCHEMA_KEY, DataType::Utf8, false),
148
+ Field::new(HISTORY_COL_FILE_ID, DataType::Utf8, true),
149
+ json_field(HISTORY_COL_SNAPSHOT_CONTENT, true),
150
+ json_field(HISTORY_COL_METADATA, true),
151
+ Field::new(HISTORY_COL_CHANGE_ID, DataType::Utf8, false),
152
+ Field::new(HISTORY_COL_OBSERVED_COMMIT_ID, DataType::Utf8, false),
153
+ Field::new(HISTORY_COL_COMMIT_CREATED_AT, DataType::Utf8, false),
154
+ Field::new(HISTORY_COL_START_COMMIT_ID, DataType::Utf8, false),
155
+ Field::new(HISTORY_COL_DEPTH, DataType::Int64, false),
156
+ ];
157
+ }
158
+
159
+ let mut fields = vec![
160
+ json_field("lixcol_entity_pk", true),
161
+ Field::new("lixcol_schema_key", DataType::Utf8, false),
162
+ Field::new("lixcol_file_id", DataType::Utf8, true),
163
+ json_field("lixcol_snapshot_content", true),
164
+ json_field("lixcol_metadata", true),
165
+ Field::new("lixcol_created_at", DataType::Utf8, true),
166
+ Field::new("lixcol_updated_at", DataType::Utf8, true),
167
+ Field::new("lixcol_global", DataType::Boolean, true),
168
+ Field::new("lixcol_change_id", DataType::Utf8, true),
169
+ Field::new("lixcol_commit_id", DataType::Utf8, true),
170
+ Field::new("lixcol_untracked", DataType::Boolean, true),
171
+ ];
172
+ if shape == EntitySurfaceShape::ByBranch {
173
+ fields.push(Field::new("lixcol_branch_id", DataType::Utf8, false));
174
+ }
175
+ fields
176
+ }
177
+
178
+ fn parse_primary_key_paths(schema: &JsonValue) -> Result<Vec<Vec<String>>, LixError> {
179
+ let Some(primary_key) = schema.get("x-lix-primary-key") else {
180
+ return Ok(Vec::new());
181
+ };
182
+ let primary_key = primary_key.as_array().ok_or_else(|| {
183
+ LixError::new(
184
+ "LIX_ERROR_UNKNOWN",
185
+ "schema x-lix-primary-key must be an array of JSON Pointers".to_string(),
186
+ )
187
+ })?;
188
+
189
+ primary_key
190
+ .iter()
191
+ .enumerate()
192
+ .map(|(index, pointer)| {
193
+ let pointer = pointer.as_str().ok_or_else(|| {
194
+ LixError::new(
195
+ "LIX_ERROR_UNKNOWN",
196
+ format!("schema x-lix-primary-key entry at index {index} must be a string"),
197
+ )
198
+ })?;
199
+ parse_json_pointer(pointer)
200
+ })
201
+ .collect()
202
+ }
203
+
204
+ // TODO(engine): share JSON Pointer parsing with schema/canonical validation once
205
+ // those helpers have a clean module boundary for SQL providers.
206
+ fn parse_json_pointer(pointer: &str) -> Result<Vec<String>, LixError> {
207
+ if pointer.is_empty() {
208
+ return Ok(Vec::new());
209
+ }
210
+ if !pointer.starts_with('/') {
211
+ return Err(LixError::new(
212
+ "LIX_ERROR_UNKNOWN",
213
+ format!("invalid JSON pointer '{pointer}'"),
214
+ ));
215
+ }
216
+ pointer[1..]
217
+ .split('/')
218
+ .map(decode_json_pointer_segment)
219
+ .collect()
220
+ }
221
+
222
+ fn decode_json_pointer_segment(segment: &str) -> Result<String, LixError> {
223
+ let mut out = String::new();
224
+ let mut chars = segment.chars();
225
+ while let Some(ch) = chars.next() {
226
+ if ch == '~' {
227
+ match chars.next() {
228
+ Some('0') => out.push('~'),
229
+ Some('1') => out.push('/'),
230
+ _ => {
231
+ return Err(LixError::new(
232
+ "LIX_ERROR_UNKNOWN",
233
+ format!("invalid JSON pointer segment '{segment}'"),
234
+ ))
235
+ }
236
+ }
237
+ } else {
238
+ out.push(ch);
239
+ }
240
+ }
241
+ Ok(out)
242
+ }
243
+
244
+ fn entity_column_type_from_schema(schema: &JsonValue) -> Option<EntityColumnType> {
245
+ let mut kinds = BTreeSet::new();
246
+ collect_entity_type_kinds(schema, &mut kinds);
247
+ kinds.remove("null");
248
+
249
+ if kinds.is_empty() {
250
+ return None;
251
+ }
252
+
253
+ if kinds.len() == 1 {
254
+ return match kinds.into_iter().next() {
255
+ Some("boolean") => Some(EntityColumnType::Boolean),
256
+ Some("integer") => Some(EntityColumnType::Integer),
257
+ Some("number") => Some(EntityColumnType::Number),
258
+ Some("string") => Some(EntityColumnType::String),
259
+ Some("object" | "array") => Some(EntityColumnType::Json),
260
+ _ => None,
261
+ };
262
+ }
263
+
264
+ Some(EntityColumnType::Json)
265
+ }
266
+
267
+ fn arrow_data_type_for_entity_column_type(column_type: EntityColumnType) -> DataType {
268
+ match column_type {
269
+ EntityColumnType::String | EntityColumnType::Json => DataType::Utf8,
270
+ EntityColumnType::Integer => DataType::Int64,
271
+ EntityColumnType::Number => DataType::Float64,
272
+ EntityColumnType::Boolean => DataType::Boolean,
273
+ }
274
+ }
275
+
276
+ fn collect_entity_type_kinds<'a>(schema: &'a JsonValue, out: &mut BTreeSet<&'a str>) {
277
+ match schema.get("type") {
278
+ Some(JsonValue::String(kind)) => {
279
+ out.insert(kind.as_str());
280
+ }
281
+ Some(JsonValue::Array(kinds)) => {
282
+ for kind in kinds.iter().filter_map(JsonValue::as_str) {
283
+ out.insert(kind);
284
+ }
285
+ }
286
+ _ => {}
287
+ }
288
+
289
+ for keyword in ["anyOf", "oneOf", "allOf"] {
290
+ if let Some(JsonValue::Array(branches)) = schema.get(keyword) {
291
+ for branch in branches {
292
+ collect_entity_type_kinds(branch, out);
293
+ }
294
+ }
295
+ }
296
+ }
@@ -0,0 +1,15 @@
1
+ pub(crate) mod capability;
2
+ pub(crate) mod entity_surface;
3
+ pub(crate) mod registry;
4
+ pub(crate) mod schema;
5
+ pub(crate) mod surface;
6
+
7
+ pub(crate) use capability::SurfaceCapabilities;
8
+ pub(crate) use entity_surface::{
9
+ derive_entity_surface_spec_from_schema, entity_surface_schema, entity_system_fields,
10
+ schema_exposed_as_entity_history_surface, schema_exposed_as_entity_surface, EntityColumnType,
11
+ EntitySurfaceShape, EntitySurfaceSpec,
12
+ };
13
+ pub(crate) use registry::PublicCatalog;
14
+ pub(crate) use schema::PublicColumn;
15
+ pub(crate) use surface::{PublicSurfaceContract, PublicSurfaceKind};