cognite-neat 0.107.0__py3-none-any.whl → 0.109.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of cognite-neat might be problematic; see the registry's advisory page for more details.

Files changed (69)
  1. cognite/neat/_constants.py +35 -1
  2. cognite/neat/_graph/_shared.py +4 -0
  3. cognite/neat/_graph/extractors/_classic_cdf/_base.py +115 -14
  4. cognite/neat/_graph/extractors/_classic_cdf/_classic.py +87 -6
  5. cognite/neat/_graph/extractors/_classic_cdf/_relationships.py +48 -12
  6. cognite/neat/_graph/extractors/_classic_cdf/_sequences.py +19 -1
  7. cognite/neat/_graph/extractors/_dms.py +162 -47
  8. cognite/neat/_graph/extractors/_dms_graph.py +54 -4
  9. cognite/neat/_graph/extractors/_mock_graph_generator.py +1 -1
  10. cognite/neat/_graph/extractors/_rdf_file.py +3 -2
  11. cognite/neat/_graph/loaders/__init__.py +1 -3
  12. cognite/neat/_graph/loaders/_rdf2dms.py +20 -10
  13. cognite/neat/_graph/queries/_base.py +144 -84
  14. cognite/neat/_graph/queries/_construct.py +1 -1
  15. cognite/neat/_graph/transformers/__init__.py +3 -1
  16. cognite/neat/_graph/transformers/_base.py +4 -4
  17. cognite/neat/_graph/transformers/_classic_cdf.py +13 -13
  18. cognite/neat/_graph/transformers/_prune_graph.py +3 -3
  19. cognite/neat/_graph/transformers/_rdfpath.py +3 -4
  20. cognite/neat/_graph/transformers/_value_type.py +71 -13
  21. cognite/neat/_issues/errors/__init__.py +2 -0
  22. cognite/neat/_issues/errors/_external.py +8 -0
  23. cognite/neat/_issues/errors/_resources.py +1 -1
  24. cognite/neat/_issues/warnings/__init__.py +0 -2
  25. cognite/neat/_issues/warnings/_models.py +1 -1
  26. cognite/neat/_issues/warnings/_properties.py +0 -8
  27. cognite/neat/_issues/warnings/_resources.py +1 -1
  28. cognite/neat/_rules/catalog/classic_model.xlsx +0 -0
  29. cognite/neat/_rules/exporters/_rules2instance_template.py +3 -3
  30. cognite/neat/_rules/exporters/_rules2yaml.py +1 -1
  31. cognite/neat/_rules/importers/__init__.py +3 -1
  32. cognite/neat/_rules/importers/_dtdl2rules/spec.py +1 -2
  33. cognite/neat/_rules/importers/_rdf/__init__.py +2 -2
  34. cognite/neat/_rules/importers/_rdf/_base.py +2 -2
  35. cognite/neat/_rules/importers/_rdf/_inference2rules.py +310 -26
  36. cognite/neat/_rules/models/_base_rules.py +22 -11
  37. cognite/neat/_rules/models/dms/_exporter.py +5 -4
  38. cognite/neat/_rules/models/dms/_rules.py +1 -8
  39. cognite/neat/_rules/models/dms/_rules_input.py +4 -0
  40. cognite/neat/_rules/models/information/_rules_input.py +5 -0
  41. cognite/neat/_rules/transformers/__init__.py +10 -3
  42. cognite/neat/_rules/transformers/_base.py +6 -1
  43. cognite/neat/_rules/transformers/_converters.py +530 -364
  44. cognite/neat/_rules/transformers/_mapping.py +4 -4
  45. cognite/neat/_session/_base.py +100 -47
  46. cognite/neat/_session/_create.py +133 -0
  47. cognite/neat/_session/_drop.py +60 -2
  48. cognite/neat/_session/_fix.py +28 -0
  49. cognite/neat/_session/_inspect.py +22 -7
  50. cognite/neat/_session/_mapping.py +8 -8
  51. cognite/neat/_session/_prepare.py +3 -247
  52. cognite/neat/_session/_read.py +138 -17
  53. cognite/neat/_session/_set.py +50 -1
  54. cognite/neat/_session/_show.py +16 -43
  55. cognite/neat/_session/_state.py +53 -52
  56. cognite/neat/_session/_to.py +11 -4
  57. cognite/neat/_session/_wizard.py +1 -1
  58. cognite/neat/_session/exceptions.py +8 -1
  59. cognite/neat/_store/_graph_store.py +301 -146
  60. cognite/neat/_store/_provenance.py +36 -20
  61. cognite/neat/_store/_rules_store.py +253 -267
  62. cognite/neat/_store/exceptions.py +40 -4
  63. cognite/neat/_utils/auth.py +5 -3
  64. cognite/neat/_version.py +1 -1
  65. {cognite_neat-0.107.0.dist-info → cognite_neat-0.109.0.dist-info}/METADATA +1 -1
  66. {cognite_neat-0.107.0.dist-info → cognite_neat-0.109.0.dist-info}/RECORD +69 -67
  67. {cognite_neat-0.107.0.dist-info → cognite_neat-0.109.0.dist-info}/LICENSE +0 -0
  68. {cognite_neat-0.107.0.dist-info → cognite_neat-0.109.0.dist-info}/WHEEL +0 -0
  69. {cognite_neat-0.107.0.dist-info → cognite_neat-0.109.0.dist-info}/entry_points.txt +0 -0
@@ -4,10 +4,10 @@ from typing import Any, cast
4
4
  from urllib.parse import quote
5
5
 
6
6
  import rdflib
7
- from rdflib import RDF, Namespace, URIRef
7
+ from rdflib import RDF, RDFS, Literal, Namespace, URIRef
8
8
  from rdflib.query import ResultRow
9
9
 
10
- from cognite.neat._constants import UNKNOWN_TYPE
10
+ from cognite.neat._constants import NEAT
11
11
  from cognite.neat._issues.warnings import PropertyDataTypeConversionWarning
12
12
  from cognite.neat._utils.auxiliary import string_to_ideal_type
13
13
  from cognite.neat._utils.rdf_ import Triple, get_namespace, remove_namespace_from_uri
@@ -24,7 +24,7 @@ class SplitMultiValueProperty(BaseTransformerStandardised):
24
24
  _need_changes = frozenset({})
25
25
 
26
26
  def __init__(self, unknown_type: URIRef | None = None) -> None:
27
- self.unknown_type = unknown_type or UNKNOWN_TYPE
27
+ self.unknown_type = unknown_type or NEAT.UnknownType
28
28
 
29
29
  def _iterate_query(self) -> str:
30
30
  query = """SELECT ?subjectType ?property
@@ -78,8 +78,8 @@ class SplitMultiValueProperty(BaseTransformerStandardised):
78
78
 
79
79
  new_property = URIRef(f"{old_property}_{remove_namespace_from_uri(value_type)}")
80
80
 
81
- row_output.add_triples.append(cast(Triple, (subject, new_property, object)))
82
- row_output.remove_triples.append(cast(Triple, (subject, old_property, object)))
81
+ row_output.add_triples.add(cast(Triple, (subject, new_property, object)))
82
+ row_output.remove_triples.add(cast(Triple, (subject, old_property, object)))
83
83
 
84
84
  row_output.instances_modified_count += 1
85
85
 
@@ -143,8 +143,8 @@ class ConvertLiteral(BaseTransformerStandardised):
143
143
  PropertyDataTypeConversionWarning(str(instance), self._type_name, self._property_name, str(e)),
144
144
  stacklevel=2,
145
145
  )
146
- row_output.add_triples.append((instance, self.subject_predicate, rdflib.Literal(converted_value))) # type: ignore[arg-type]
147
- row_output.remove_triples.append((instance, self.subject_predicate, literal)) # type: ignore[arg-type]
146
+ row_output.add_triples.add((instance, self.subject_predicate, rdflib.Literal(converted_value))) # type: ignore[arg-type]
147
+ row_output.remove_triples.add((instance, self.subject_predicate, literal)) # type: ignore[arg-type]
148
148
  row_output.instances_modified_count += 1
149
149
 
150
150
  return row_output
@@ -221,15 +221,15 @@ class LiteralToEntity(BaseTransformerStandardised):
221
221
  namespace = Namespace(get_namespace(instance)) # type: ignore[arg-type]
222
222
  entity_type = namespace[self.entity_type]
223
223
  new_entity = namespace[f"{self.entity_type}_{quote(value)!s}"]
224
- row_output.add_triples.append((new_entity, RDF.type, entity_type))
224
+ row_output.add_triples.add((new_entity, RDF.type, entity_type))
225
225
  row_output.instances_added_count += 1 # we add one new entity
226
226
 
227
227
  if self.new_property is not None:
228
- row_output.add_triples.append((new_entity, namespace[self.new_property], rdflib.Literal(value))) # type: ignore[arg-type]
228
+ row_output.add_triples.add((new_entity, namespace[self.new_property], rdflib.Literal(value))) # type: ignore[arg-type]
229
229
  row_output.instances_modified_count += 1 # we modify the new entity
230
230
 
231
- row_output.add_triples.append((instance, self.subject_predicate, new_entity)) # type: ignore[arg-type]
232
- row_output.remove_triples.append((instance, self.subject_predicate, literal)) # type: ignore[arg-type]
231
+ row_output.add_triples.add((instance, self.subject_predicate, new_entity)) # type: ignore[arg-type]
232
+ row_output.remove_triples.add((instance, self.subject_predicate, literal)) # type: ignore[arg-type]
233
233
  row_output.instances_modified_count += 1 # we modify the old entity
234
234
 
235
235
  return row_output
@@ -300,8 +300,66 @@ class ConnectionToLiteral(BaseTransformerStandardised):
300
300
  instance, object_entity = cast(tuple[URIRef, URIRef], query_result_row)
301
301
  value = remove_namespace_from_uri(object_entity)
302
302
 
303
- row_output.add_triples.append((instance, self.subject_predicate, rdflib.Literal(value)))
304
- row_output.remove_triples.append((instance, self.subject_predicate, object_entity))
303
+ row_output.add_triples.add((instance, self.subject_predicate, rdflib.Literal(value)))
304
+ row_output.remove_triples.add((instance, self.subject_predicate, object_entity))
305
+ row_output.instances_modified_count += 1
306
+
307
+ return row_output
308
+
309
+
310
+ class SetType(BaseTransformerStandardised):
311
+ description = "Set the type of an instance based on a property"
312
+
313
+ def __init__(
314
+ self,
315
+ subject_type: URIRef,
316
+ subject_predicate: URIRef,
317
+ drop_property: bool = False,
318
+ namespace: Namespace | None = None,
319
+ ) -> None:
320
+ self.subject_type = subject_type
321
+ self.subject_predicate = subject_predicate
322
+ self.drop_property = drop_property
323
+ self._namespace = namespace or Namespace(get_namespace(subject_type))
324
+
325
+ def _count_query(self) -> str:
326
+ query = """SELECT (COUNT(?object) AS ?objectCount)
327
+ WHERE {{
328
+ ?instance a <{subject_type}> .
329
+ ?instance <{subject_predicate}> ?object
330
+ FILTER(isLiteral(?object))
331
+ }}"""
332
+ return query.format(subject_type=self.subject_type, subject_predicate=self.subject_predicate)
333
+
334
+ def _skip_count_query(self) -> str:
335
+ query = """SELECT (COUNT(?object) AS ?objectCount)
336
+ WHERE {{
337
+ ?instance a <{subject_type}> .
338
+ ?instance <{subject_predicate}> ?object
339
+ FILTER(isIRI(?object))
340
+ }}"""
341
+ return query.format(subject_type=self.subject_type, subject_predicate=self.subject_predicate)
342
+
343
+ def _iterate_query(self) -> str:
344
+ query = """SELECT ?instance ?object
345
+ WHERE {{
346
+ ?instance a <{subject_type}> .
347
+ ?instance <{subject_predicate}> ?object
348
+ FILTER(isLiteral(?object))
349
+ }}"""
350
+ return query.format(subject_type=self.subject_type, subject_predicate=self.subject_predicate)
351
+
352
+ def operation(self, query_result_row: ResultRow) -> RowTransformationOutput:
353
+ row_output = RowTransformationOutput()
354
+
355
+ instance, object_literal = cast(tuple[URIRef, Literal], query_result_row)
356
+ if self.drop_property:
357
+ row_output.remove_triples.add((instance, self.subject_predicate, object_literal))
358
+
359
+ row_output.remove_triples.add((instance, RDF.type, self.subject_type))
360
+ new_type = self._namespace[quote(object_literal.toPython())]
361
+ row_output.add_triples.add((instance, RDF.type, new_type))
362
+ row_output.add_triples.add((new_type, RDFS.subClassOf, self.subject_type))
305
363
  row_output.instances_modified_count += 1
306
364
 
307
365
  return row_output
@@ -9,6 +9,7 @@ from ._external import (
9
9
  FileReadError,
10
10
  FileTypeUnexpectedError,
11
11
  NeatYamlError,
12
+ OxigraphStorageLockedError,
12
13
  )
13
14
  from ._general import NeatImportError, NeatTypeError, NeatValueError, RegexViolationError
14
15
  from ._properties import (
@@ -51,6 +52,7 @@ __all__ = [
51
52
  "NeatTypeError",
52
53
  "NeatValueError",
53
54
  "NeatYamlError",
55
+ "OxigraphStorageLockedError",
54
56
  "PropertyDefinitionDuplicatedError",
55
57
  "PropertyDefinitionError",
56
58
  "PropertyMappingDuplicatedError",
@@ -23,6 +23,14 @@ class FileReadError(NeatError, RuntimeError):
23
23
  reason: str
24
24
 
25
25
 
26
+ @dataclass(unsafe_hash=True)
27
+ class OxigraphStorageLockedError(NeatError, RuntimeError):
28
+ """Oxigraph on-disk storage locked at the path {filepath}"""
29
+
30
+ fix = "Delete LOCK file in the {filepath} folder to unlock the storage or use another storage path"
31
+ filepath: Path
32
+
33
+
26
34
  @dataclass(unsafe_hash=True)
27
35
  class FileNotFoundNeatError(NeatError, FileNotFoundError):
28
36
  """File {filepath} not found"""
@@ -30,7 +30,7 @@ class ResourceRetrievalError(ResourceError[T_Identifier]):
30
30
 
31
31
  @dataclass(unsafe_hash=True)
32
32
  class ResourceNotFoundError(ResourceError, Generic[T_Identifier, T_ReferenceIdentifier]):
33
- """The {resource_type} with identifier {identifier} does not exist"""
33
+ """The {resource_type} with identifier '{identifier}' does not exist"""
34
34
 
35
35
  extra = " This is expected by {referred_type} {referred_by}."
36
36
 
@@ -31,7 +31,6 @@ from ._properties import (
31
31
  PropertyDirectRelationLimitWarning,
32
32
  PropertyNotFoundWarning,
33
33
  PropertyOverwritingWarning,
34
- PropertySkippedWarning,
35
34
  PropertyTypeNotSupportedWarning,
36
35
  PropertyValueTypeUndefinedWarning,
37
36
  )
@@ -68,7 +67,6 @@ __all__ = [
68
67
  "PropertyDirectRelationLimitWarning",
69
68
  "PropertyNotFoundWarning",
70
69
  "PropertyOverwritingWarning",
71
- "PropertySkippedWarning",
72
70
  "PropertyTypeNotSupportedWarning",
73
71
  "PropertyValueTypeUndefinedWarning",
74
72
  "RegexViolationWarning",
@@ -74,7 +74,7 @@ class CDFNotSupportedWarning(NeatWarning, ABC):
74
74
  class NotSupportedViewContainerLimitWarning(CDFNotSupportedWarning):
75
75
  """The view {view_id} maps, {count} containers, which is more than the limit {limit}."""
76
76
 
77
- fix = "Reduce the number of containers the view maps to." ""
77
+ fix = "Reduce the number of containers the view maps to."
78
78
 
79
79
  view_id: ViewId
80
80
  count: int
@@ -65,14 +65,6 @@ class PropertyOverwritingWarning(PropertyWarning[T_Identifier]):
65
65
  overwriting: tuple[str, ...]
66
66
 
67
67
 
68
- @dataclass(unsafe_hash=True)
69
- class PropertySkippedWarning(PropertyWarning[T_Identifier]):
70
- """The {resource_type} with identifier {identifier} has a property {property_name}
71
- which is skipped. {reason}."""
72
-
73
- reason: str
74
-
75
-
76
68
  @dataclass(unsafe_hash=True)
77
69
  class PropertyDataTypeConversionWarning(PropertyWarning[T_Identifier]):
78
70
  """The {resource_type} with identifier {identifier} failed to convert the property {property_name}: {error}"""
@@ -21,7 +21,7 @@ class ResourceRegexViolationWarning(ResourceNeatWarning):
21
21
 
22
22
  fix = (
23
23
  "Either export the data model and make the necessary changes manually"
24
- " or run prepare.data_model.cdf_compliant_external_ids."
24
+ " or run fix.data_model.cdf_compliant_external_ids."
25
25
  )
26
26
 
27
27
  location: str
@@ -96,13 +96,13 @@ class InstanceTemplateExporter(BaseExporter[InformationRules, Workbook]):
96
96
  def _add_index_identifiers(workbook: Workbook, sheet: str, no_rows: int):
97
97
  """Adds index-based auto identifier to a sheet identifier column"""
98
98
  for i in range(no_rows):
99
- workbook[sheet][f"A{i+2}"] = f'=IF(ISBLANK(B{i+2}), "","{sheet}-{i+1}")'
99
+ workbook[sheet][f"A{i + 2}"] = f'=IF(ISBLANK(B{i + 2}), "","{sheet}-{i + 1}")'
100
100
 
101
101
 
102
102
  def _add_uuid_identifiers(workbook: Workbook, sheet: str, no_rows: int):
103
103
  """Adds UUID-based auto identifier to a sheet identifier column"""
104
104
  for i in range(no_rows):
105
- workbook[sheet][f"A{i+2}"] = f'=IF(ISBLANK(B{i+2}), "","{sheet}-{uuid.uuid4()}")'
105
+ workbook[sheet][f"A{i + 2}"] = f'=IF(ISBLANK(B{i + 2}), "","{sheet}-{uuid.uuid4()}")'
106
106
 
107
107
 
108
108
  def _add_drop_down_list(
@@ -122,7 +122,7 @@ def _add_drop_down_list(
122
122
  workbook[sheet].add_data_validation(drop_down_list)
123
123
 
124
124
  for i in range(no_rows):
125
- drop_down_list.add(workbook[sheet][f"{column}{i+2}"])
125
+ drop_down_list.add(workbook[sheet][f"{column}{i + 2}"])
126
126
 
127
127
 
128
128
  def _adjust_column_width(workbook: Workbook):
@@ -72,7 +72,7 @@ class YAMLExporter(BaseExporter[VerifiedRules, str]):
72
72
  """
73
73
  # model_dump_json ensures that the output is in JSON format,
74
74
  # if we don't do this, we will get Enums and other types that are not serializable to YAML
75
- json_output = rules.dump(mode="json", exclude_none=True, exclude_unset=True)
75
+ json_output = rules.dump(mode="json", sort=True, exclude_none=True, exclude_unset=True)
76
76
  if self.output == "json":
77
77
  return json.dumps(json_output)
78
78
  elif self.output == "yaml":
@@ -1,7 +1,7 @@
1
1
  from ._base import BaseImporter
2
2
  from ._dms2rules import DMSImporter
3
3
  from ._dtdl2rules import DTDLImporter
4
- from ._rdf import IMFImporter, InferenceImporter, OWLImporter
4
+ from ._rdf import IMFImporter, InferenceImporter, OWLImporter, SubclassInferenceImporter
5
5
  from ._spreadsheet2rules import ExcelImporter, GoogleSheetImporter
6
6
  from ._yaml2rules import YAMLImporter
7
7
 
@@ -14,6 +14,7 @@ __all__ = [
14
14
  "IMFImporter",
15
15
  "InferenceImporter",
16
16
  "OWLImporter",
17
+ "SubclassInferenceImporter",
17
18
  "YAMLImporter",
18
19
  ]
19
20
 
@@ -26,6 +27,7 @@ RulesImporters = (
26
27
  | DTDLImporter
27
28
  | YAMLImporter
28
29
  | InferenceImporter
30
+ | SubclassInferenceImporter
29
31
  )
30
32
 
31
33
 
@@ -302,8 +302,7 @@ class Interface(DTDLBase):
302
302
  spec_version = frozenset(["2", "3"])
303
303
  default_context: ClassVar[IRI] = Field(
304
304
  "dtmi:dtdl:context;3",
305
- description="This can be set directly on the class to change the "
306
- "default context used when parsing a document.",
305
+ description="This can be set directly on the class to change the default context used when parsing a document.",
307
306
  )
308
307
  id_: DTMI = Field(alias="@id") # type: ignore[assignment]
309
308
  context: IRI | None = Field(alias="@context")
@@ -1,5 +1,5 @@
1
1
  from ._imf2rules import IMFImporter
2
- from ._inference2rules import InferenceImporter
2
+ from ._inference2rules import InferenceImporter, SubclassInferenceImporter
3
3
  from ._owl2rules import OWLImporter
4
4
 
5
- __all__ = ["IMFImporter", "InferenceImporter", "OWLImporter"]
5
+ __all__ = ["IMFImporter", "InferenceImporter", "OWLImporter", "SubclassInferenceImporter"]
@@ -72,7 +72,7 @@ class BaseRDFImporter(BaseImporter[InformationInputRules]):
72
72
  ):
73
73
  return cls(
74
74
  IssueList(title=f"{cls.__name__} issues"),
75
- store.graph,
75
+ store.dataset,
76
76
  data_model_id=data_model_id,
77
77
  max_number_of_instance=max_number_of_instance,
78
78
  non_existing_node_type=non_existing_node_type,
@@ -140,7 +140,7 @@ class BaseRDFImporter(BaseImporter[InformationInputRules]):
140
140
  prefixes: Dict of prefixes and namespaces
141
141
  """
142
142
  if Namespace(get_namespace(URI)) not in prefixes.values():
143
- prefixes[f"prefix_{len(prefixes)+1}"] = Namespace(get_namespace(URI))
143
+ prefixes[f"prefix_{len(prefixes) + 1}"] = Namespace(get_namespace(URI))
144
144
 
145
145
  @property
146
146
  def _metadata(self) -> dict: