omnata-plugin-runtime 0.10.7a254__tar.gz → 0.10.8a256__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/PKG-INFO +1 -1
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/pyproject.toml +1 -1
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/src/omnata_plugin_runtime/json_schema.py +60 -16
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/LICENSE +0 -0
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/README.md +0 -0
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/src/omnata_plugin_runtime/__init__.py +0 -0
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/src/omnata_plugin_runtime/api.py +0 -0
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/src/omnata_plugin_runtime/configuration.py +0 -0
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/src/omnata_plugin_runtime/forms.py +0 -0
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/src/omnata_plugin_runtime/logging.py +0 -0
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/src/omnata_plugin_runtime/omnata_plugin.py +0 -0
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/src/omnata_plugin_runtime/plugin_entrypoints.py +0 -0
- {omnata_plugin_runtime-0.10.7a254 → omnata_plugin_runtime-0.10.8a256}/src/omnata_plugin_runtime/rate_limiting.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
[tool.poetry]
|
2
2
|
name = "omnata-plugin-runtime"
|
3
|
-
version = "0.10.
|
3
|
+
version = "0.10.8-a256"
|
4
4
|
description = "Classes and common runtime components for building and running Omnata Plugins"
|
5
5
|
authors = ["James Weakley <james.weakley@omnata.com>"]
|
6
6
|
readme = "README.md"
|
@@ -52,6 +52,9 @@ class JsonSchemaProperty(BaseModel):
|
|
52
52
|
requiredStreamNames: Optional[List[str]] = Field(
|
53
53
|
None, description="The names of the streams that are depended upon by this column, via joins. If these streams are not selected, the column will be omitted."
|
54
54
|
)
|
55
|
+
referencedFields: Optional[Dict[str,List[str]]] = Field(
|
56
|
+
None, description="The names of fields that are referenced by this field, keyed on the stream name (or None if it's the current stream). This is used to order the fields, and also to cascade the removal of unsupported fields (e.g. in formulas)."
|
57
|
+
)
|
55
58
|
|
56
59
|
@model_validator(mode='after')
|
57
60
|
def validate(self) -> Self:
|
@@ -165,6 +168,9 @@ class SnowflakeViewColumn(BaseModel):
|
|
165
168
|
required_stream_names: Optional[List[str]] = Field(
|
166
169
|
default=None, description="The names of the streams that are depended upon by this column, via joins. If these streams are not selected, the column will be omitted"
|
167
170
|
)
|
171
|
+
referenced_columns: Optional[Dict[str,List[str]]] = Field(
|
172
|
+
default=None, description="The names of columns that are referenced by this column, keyed on the stream name (or None if it's the current stream). This is used to order the columns, and also to cascade the removal of unsupported columns (e.g. in formulas)."
|
173
|
+
)
|
168
174
|
|
169
175
|
def __repr__(self) -> str:
|
170
176
|
return "SnowflakeViewColumn(name=%r, definition=%r, comment=%r)" % (
|
@@ -230,19 +236,23 @@ class SnowflakeViewColumn(BaseModel):
|
|
230
236
|
if not json_schema_property.snowflakeColumnExpression:
|
231
237
|
expression=f"""{expression}::{json_schema_property.snowflake_data_type}"""
|
232
238
|
required_stream_names = None
|
239
|
+
referenced_columns = None
|
233
240
|
if json_schema_property.requiredStreamNames:
|
234
241
|
required_stream_names = json_schema_property.requiredStreamNames
|
242
|
+
if json_schema_property.referencedFields:
|
243
|
+
referenced_columns = json_schema_property.referencedFields
|
235
244
|
return cls(
|
236
245
|
name=final_column_name,
|
237
246
|
original_name=column_name,
|
238
247
|
expression=expression,
|
239
248
|
comment=comment,
|
240
249
|
is_join_column=json_schema_property.isJoinColumn,
|
241
|
-
required_stream_names=required_stream_names
|
250
|
+
required_stream_names=required_stream_names,
|
251
|
+
referenced_columns=referenced_columns
|
242
252
|
)
|
243
253
|
|
244
254
|
@classmethod
|
245
|
-
def order_by_reference(cls,columns:List[Self]) -> List[Self]:
|
255
|
+
def order_by_reference(cls,current_stream_name:str,columns:List[Self]) -> List[Self]:
|
246
256
|
"""
|
247
257
|
In some situations, column expressions may reference the alias of another column
|
248
258
|
This is allowed in Snowflake, as long as the aliased column is defined before it's used in a later column
|
@@ -262,7 +272,7 @@ class SnowflakeViewColumn(BaseModel):
|
|
262
272
|
for other_column in columns:
|
263
273
|
if column==other_column:
|
264
274
|
continue
|
265
|
-
if
|
275
|
+
if column.original_name in (other_column.referenced_columns or {}).get(current_stream_name,[]):
|
266
276
|
if column not in columns_to_move:
|
267
277
|
columns_to_move.append(column)
|
268
278
|
|
@@ -413,6 +423,12 @@ class SnowflakeViewPart(BaseModel):
|
|
413
423
|
select {', '.join([c.definition(original_name=original_name) for c in self.direct_columns()])}
|
414
424
|
from {self.raw_table_location.get_fully_qualified_name()}
|
415
425
|
) """
|
426
|
+
|
427
|
+
def columns_missing(self,columns_to_check:List[str]) -> List[str]:
|
428
|
+
"""
|
429
|
+
Returns a list of columns that are missing from the view part.
|
430
|
+
"""
|
431
|
+
return [c for c in columns_to_check if c not in [c.original_name for c in self.columns]]
|
416
432
|
|
417
433
|
class SnowflakeViewParts(BaseModel):
|
418
434
|
"""
|
@@ -484,7 +500,7 @@ class SnowflakeViewParts(BaseModel):
|
|
484
500
|
column_name_environment=column_name_environment,
|
485
501
|
column_name_expression=column_name_expression
|
486
502
|
)
|
487
|
-
joined_parts = []
|
503
|
+
joined_parts:List[SnowflakeViewPart] = []
|
488
504
|
# remove the joins from the main part if they are not in the raw stream locations
|
489
505
|
main_stream_view_part.joins = [join for join in main_stream_view_part.joins
|
490
506
|
if join.join_stream_name in raw_stream_locations
|
@@ -499,21 +515,49 @@ class SnowflakeViewParts(BaseModel):
|
|
499
515
|
column_name_environment=column_name_environment,
|
500
516
|
column_name_expression=column_name_expression
|
501
517
|
))
|
502
|
-
# For each column, the plugin can advise which
|
518
|
+
# For each column, the plugin can advise which fields (of the same stream or joined) are required for the join, which comes through as referenced_columns
|
503
519
|
# on the SnowflakeViewColumn object.
|
504
|
-
# Until this generate function is called with the raw stream names, we don't know which streams the user has actually selected
|
505
|
-
#
|
506
|
-
|
507
|
-
|
508
|
-
|
509
|
-
|
510
|
-
|
511
|
-
|
512
|
-
|
520
|
+
# Until this generate function is called with the raw stream names, we don't know which streams the user has actually selected, nor which
|
521
|
+
# fields are actually available (some may be dropped due to something like an unsupported formula).
|
522
|
+
# So now there's a pruning process where we remove columns that reference fields that are not available.
|
523
|
+
# We'll start by doing a first pass and removing unavailable columns from other streams
|
524
|
+
# then, we can do a final pass and remove columns that reference fields that are not available in the current stream
|
525
|
+
prune_count = 0
|
526
|
+
while prune(main_stream_view_part,joined_parts):
|
527
|
+
prune_count += 1
|
528
|
+
if prune_count > 10000:
|
529
|
+
raise ValueError("Pruning of columns from the view has entered an infinite loop")
|
513
530
|
|
514
531
|
return cls(main_part=main_stream_view_part, joined_parts=joined_parts)
|
515
532
|
|
516
|
-
|
533
|
+
def prune(view_part:SnowflakeViewPart,joined_parts:List[SnowflakeViewPart]) -> bool:
|
534
|
+
"""
|
535
|
+
Prunes columns from the main view part that reference fields that are not available in the joined parts.
|
536
|
+
Returns True if columns were removed, False otherwise.
|
537
|
+
"""
|
538
|
+
for column in view_part.columns:
|
539
|
+
if column.referenced_columns:
|
540
|
+
for referenced_stream_name, referenced_fields in column.referenced_columns.items():
|
541
|
+
|
542
|
+
if referenced_stream_name == view_part.stream_name:
|
543
|
+
part = view_part
|
544
|
+
else:
|
545
|
+
part = next((part for part in joined_parts if part.stream_name==referenced_stream_name),None)
|
546
|
+
if part is None:
|
547
|
+
logger.warning(f"Column {column.name} in stream {view_part.stream_name} references stream {referenced_stream_name}, but it was not provided")
|
548
|
+
view_part.columns.remove(column)
|
549
|
+
return True
|
550
|
+
|
551
|
+
columns_missing_from_join = part.columns_missing(referenced_fields)
|
552
|
+
if len(columns_missing_from_join) > 0:
|
553
|
+
logger.warning(f"Column {column.name} in stream {view_part.stream_name} references fields {columns_missing_from_join} in stream {referenced_stream_name}, but they were not provided")
|
554
|
+
view_part.columns.remove(column)
|
555
|
+
return True
|
556
|
+
else:
|
557
|
+
# no columns were removed, but we need to check if the columns that are referenced are not themselves referencing other missing columns
|
558
|
+
return prune(part,joined_parts)
|
559
|
+
|
560
|
+
return False
|
517
561
|
|
518
562
|
class JsonSchemaTopLevel(BaseModel):
|
519
563
|
"""
|
@@ -679,7 +723,7 @@ def normalized_view_part(
|
|
679
723
|
#- APP_IDENTIFIER
|
680
724
|
#- Direct and joined columns, ordered so that columns that reference other columns are defined after the columns they reference
|
681
725
|
#- OMNATA_RETRIEVE_DATE, OMNATA_RAW_RECORD, OMNATA_IS_DELETED, OMNATA_RUN_ID
|
682
|
-
view_columns = SnowflakeViewColumn.order_by_reference(direct_view_columns +
|
726
|
+
view_columns = SnowflakeViewColumn.order_by_reference(stream_name,direct_view_columns +
|
683
727
|
join_view_columns)
|
684
728
|
return SnowflakeViewPart(
|
685
729
|
stream_name=stream_name,
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|