relationalai 1.0.0a3__py3-none-any.whl → 1.0.0a5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- relationalai/config/config.py +47 -21
- relationalai/config/connections/__init__.py +5 -2
- relationalai/config/connections/duckdb.py +2 -2
- relationalai/config/connections/local.py +31 -0
- relationalai/config/connections/snowflake.py +0 -1
- relationalai/config/external/raiconfig_converter.py +235 -0
- relationalai/config/external/raiconfig_models.py +202 -0
- relationalai/config/external/utils.py +31 -0
- relationalai/config/shims.py +1 -0
- relationalai/semantics/__init__.py +10 -8
- relationalai/semantics/backends/sql/sql_compiler.py +1 -4
- relationalai/semantics/experimental/__init__.py +0 -0
- relationalai/semantics/experimental/builder.py +295 -0
- relationalai/semantics/experimental/builtins.py +154 -0
- relationalai/semantics/frontend/base.py +67 -42
- relationalai/semantics/frontend/core.py +34 -6
- relationalai/semantics/frontend/front_compiler.py +209 -37
- relationalai/semantics/frontend/pprint.py +6 -2
- relationalai/semantics/metamodel/__init__.py +7 -0
- relationalai/semantics/metamodel/metamodel.py +2 -0
- relationalai/semantics/metamodel/metamodel_analyzer.py +58 -16
- relationalai/semantics/metamodel/pprint.py +6 -1
- relationalai/semantics/metamodel/rewriter.py +11 -7
- relationalai/semantics/metamodel/typer.py +116 -41
- relationalai/semantics/reasoners/__init__.py +11 -0
- relationalai/semantics/reasoners/graph/__init__.py +35 -0
- relationalai/semantics/reasoners/graph/core.py +9028 -0
- relationalai/semantics/std/__init__.py +30 -10
- relationalai/semantics/std/aggregates.py +641 -12
- relationalai/semantics/std/common.py +146 -13
- relationalai/semantics/std/constraints.py +71 -1
- relationalai/semantics/std/datetime.py +904 -21
- relationalai/semantics/std/decimals.py +143 -2
- relationalai/semantics/std/floats.py +57 -4
- relationalai/semantics/std/integers.py +98 -4
- relationalai/semantics/std/math.py +857 -35
- relationalai/semantics/std/numbers.py +216 -20
- relationalai/semantics/std/re.py +213 -5
- relationalai/semantics/std/strings.py +437 -44
- relationalai/shims/executor.py +60 -52
- relationalai/shims/fixtures.py +85 -0
- relationalai/shims/helpers.py +26 -2
- relationalai/shims/hoister.py +28 -9
- relationalai/shims/mm2v0.py +204 -173
- relationalai/tools/cli/cli.py +192 -10
- relationalai/tools/cli/components/progress_reader.py +1 -1
- relationalai/tools/cli/docs.py +394 -0
- relationalai/tools/debugger.py +11 -4
- relationalai/tools/qb_debugger.py +435 -0
- relationalai/tools/typer_debugger.py +1 -2
- relationalai/util/dataclasses.py +3 -5
- relationalai/util/docutils.py +1 -2
- relationalai/util/error.py +2 -5
- relationalai/util/python.py +23 -0
- relationalai/util/runtime.py +1 -2
- relationalai/util/schema.py +2 -4
- relationalai/util/structures.py +4 -2
- relationalai/util/tracing.py +8 -2
- {relationalai-1.0.0a3.dist-info → relationalai-1.0.0a5.dist-info}/METADATA +8 -5
- {relationalai-1.0.0a3.dist-info → relationalai-1.0.0a5.dist-info}/RECORD +118 -95
- {relationalai-1.0.0a3.dist-info → relationalai-1.0.0a5.dist-info}/WHEEL +1 -1
- v0/relationalai/__init__.py +1 -1
- v0/relationalai/clients/client.py +52 -18
- v0/relationalai/clients/exec_txn_poller.py +122 -0
- v0/relationalai/clients/local.py +23 -8
- v0/relationalai/clients/resources/azure/azure.py +36 -11
- v0/relationalai/clients/resources/snowflake/__init__.py +4 -4
- v0/relationalai/clients/resources/snowflake/cli_resources.py +12 -1
- v0/relationalai/clients/resources/snowflake/direct_access_resources.py +124 -100
- v0/relationalai/clients/resources/snowflake/engine_service.py +381 -0
- v0/relationalai/clients/resources/snowflake/engine_state_handlers.py +35 -29
- v0/relationalai/clients/resources/snowflake/error_handlers.py +43 -2
- v0/relationalai/clients/resources/snowflake/snowflake.py +277 -179
- v0/relationalai/clients/resources/snowflake/use_index_poller.py +8 -0
- v0/relationalai/clients/types.py +5 -0
- v0/relationalai/errors.py +19 -1
- v0/relationalai/semantics/lqp/algorithms.py +173 -0
- v0/relationalai/semantics/lqp/builtins.py +199 -2
- v0/relationalai/semantics/lqp/executor.py +68 -37
- v0/relationalai/semantics/lqp/ir.py +28 -2
- v0/relationalai/semantics/lqp/model2lqp.py +215 -45
- v0/relationalai/semantics/lqp/passes.py +13 -658
- v0/relationalai/semantics/lqp/rewrite/__init__.py +12 -0
- v0/relationalai/semantics/lqp/rewrite/algorithm.py +385 -0
- v0/relationalai/semantics/lqp/rewrite/constants_to_vars.py +70 -0
- v0/relationalai/semantics/lqp/rewrite/deduplicate_vars.py +104 -0
- v0/relationalai/semantics/lqp/rewrite/eliminate_data.py +108 -0
- v0/relationalai/semantics/lqp/rewrite/extract_keys.py +25 -3
- v0/relationalai/semantics/lqp/rewrite/period_math.py +77 -0
- v0/relationalai/semantics/lqp/rewrite/quantify_vars.py +65 -31
- v0/relationalai/semantics/lqp/rewrite/unify_definitions.py +317 -0
- v0/relationalai/semantics/lqp/utils.py +11 -1
- v0/relationalai/semantics/lqp/validators.py +14 -1
- v0/relationalai/semantics/metamodel/builtins.py +2 -1
- v0/relationalai/semantics/metamodel/compiler.py +2 -1
- v0/relationalai/semantics/metamodel/dependency.py +12 -3
- v0/relationalai/semantics/metamodel/executor.py +11 -1
- v0/relationalai/semantics/metamodel/factory.py +2 -2
- v0/relationalai/semantics/metamodel/helpers.py +7 -0
- v0/relationalai/semantics/metamodel/ir.py +3 -2
- v0/relationalai/semantics/metamodel/rewrite/dnf_union_splitter.py +30 -20
- v0/relationalai/semantics/metamodel/rewrite/flatten.py +50 -13
- v0/relationalai/semantics/metamodel/rewrite/format_outputs.py +9 -3
- v0/relationalai/semantics/metamodel/typer/checker.py +6 -4
- v0/relationalai/semantics/metamodel/typer/typer.py +4 -3
- v0/relationalai/semantics/metamodel/visitor.py +4 -3
- v0/relationalai/semantics/reasoners/optimization/solvers_dev.py +1 -1
- v0/relationalai/semantics/reasoners/optimization/solvers_pb.py +336 -86
- v0/relationalai/semantics/rel/compiler.py +2 -1
- v0/relationalai/semantics/rel/executor.py +3 -2
- v0/relationalai/semantics/tests/lqp/__init__.py +0 -0
- v0/relationalai/semantics/tests/lqp/algorithms.py +345 -0
- v0/relationalai/tools/cli.py +339 -186
- v0/relationalai/tools/cli_controls.py +216 -67
- v0/relationalai/tools/cli_helpers.py +410 -6
- v0/relationalai/util/format.py +5 -2
- {relationalai-1.0.0a3.dist-info → relationalai-1.0.0a5.dist-info}/entry_points.txt +0 -0
- {relationalai-1.0.0a3.dist-info → relationalai-1.0.0a5.dist-info}/top_level.txt +0 -0
|
@@ -1,18 +1,30 @@
|
|
|
1
|
+
"""Rewrite passes applied to metamodel IR before lowering to LQP.

Each re-exported name is a single, self-contained rewrite pass; ``__all__``
fixes the public surface of this package.
"""
from .algorithm import AlgorithmPass
from .annotate_constraints import AnnotateConstraints
from .cdc import CDC
from .constants_to_vars import ConstantsToVars
from .deduplicate_vars import DeduplicateVars
from .eliminate_data import EliminateData
from .extract_common import ExtractCommon
from .extract_keys import ExtractKeys
from .function_annotations import FunctionAnnotations, SplitMultiCheckRequires
from .period_math import PeriodMath
from .quantify_vars import QuantifyVars
from .splinter import Splinter
from .unify_definitions import UnifyDefinitions

__all__ = [
    "AlgorithmPass",
    "AnnotateConstraints",
    "CDC",
    "ConstantsToVars",
    "DeduplicateVars",
    "EliminateData",
    "ExtractCommon",
    "ExtractKeys",
    "FunctionAnnotations",
    "PeriodMath",
    "QuantifyVars",
    "Splinter",
    "SplitMultiCheckRequires",
    "UnifyDefinitions",
]
|
|
@@ -0,0 +1,385 @@
|
|
|
1
|
+
from collections import defaultdict
|
|
2
|
+
from typing import Optional, TypeGuard, Union, cast
|
|
3
|
+
from v0.relationalai.semantics.metamodel import ir, helpers, factory
|
|
4
|
+
from v0.relationalai.semantics.metamodel.compiler import Pass
|
|
5
|
+
from v0.relationalai.semantics.metamodel.visitor import Visitor, Rewriter, collect_by_type
|
|
6
|
+
from v0.relationalai.semantics.lqp.algorithms import (
|
|
7
|
+
is_script, is_algorithm_script,is_logical_instruction, is_update_instruction,
|
|
8
|
+
get_instruction_head_rels, get_instruction_body_rels, mk_assign, split_instruction
|
|
9
|
+
)
|
|
10
|
+
|
|
11
|
+
class AlgorithmPass(Pass):
    """
    Transforms algorithm scripts by normalizing Loopy constructs (iterative algorithm).

    This pass applies three main rewriting transformations to Metamodel IR that prepare
    algorithm scripts for execution, in the order listed below:

    1. **Intermediate Rescoping**: Moves nested logical intermediate relations from their
       original logical scope into algorithm scripts, placing them immediately before each
       instruction that uses them (which can include Break instructions). Removes
       intermediates from the logical scope if they're only used within algorithms.
       TODO: Monitor https://github.com/RelationalAI/relationalai-python/pull/3187

       Example (Metamodel IR):
       BEFORE:
           Logical
               Logical
                   R(x::Int128, y::Int128)
                   → derive _nested_logical_1(x::Int128, y::Int128) @assign
               Sequence @script @algorithm
                   Logical
                       _nested_logical_1(a::Int128, b::Int128)
                       → derive S(a::Int128, b::Int128) @assign

       AFTER:
           Logical
               Sequence @script @algorithm
                   Logical
                       R(x::Int128, y::Int128)
                       → derive _nested_logical_1(x::Int128, y::Int128) @assign
                   Logical
                       _nested_logical_1(a::Int128, b::Int128)
                       → derive S(a::Int128, b::Int128) @assign

    2. **Update Normalization**: Transforms Loopy update operations (@upsert, @monoid, @monus)
       to use a single body atom. Complex bodies with multiple lookups or additional
       operations are normalized by introducing intermediate relations.

       Example (Metamodel IR):
       BEFORE:
           Logical
               R(x::Int128, y::Int128)
               S(y::Int128, z::Int128)
               → derive T(x::Int128, z::Int128) @upsert

       AFTER:
           Logical
               R(x::Int128, y::Int128)
               S(y::Int128, z::Int128)
               → derive _loopy_update_intermediate_1(x::Int128, z::Int128) @assign

           Logical
               _loopy_update_intermediate_1(x::Int128, z::Int128)
               → derive T(x::Int128, z::Int128) @upsert

    3. **Recursive Assignment Decoupling**: Decouples self-referential assignments where the
       head relation appears in the body by introducing a copy relation. This transformation
       is required for BackIR analysis compatibility.

       Example (Metamodel IR):
       BEFORE:
           Logical
               iter(i::Int128)
               rel_primitive_int128_add(i::Int128, 1::Int128, i_plus_1::Int128)
               → derive iter(i_plus_1::Int128) @assign

       AFTER:
           Logical
               iter(i::Int128)
               → derive _loopy_iter_copy_1(i::Int128) @assign

           Logical
               _loopy_iter_copy_1(i::Int128)
               rel_primitive_int128_add(i::Int128, 1::Int128, i_plus_1::Int128)
               → derive iter(i_plus_1::Int128) @assign
    """
    def rewrite(self, model: ir.Model, options: dict = {}) -> ir.Model:
        # Find all nested logical intermediates
        intermediate_finder = FindIntermediates()
        model.accept(intermediate_finder)

        # Analyze where each intermediate is used (inside vs. outside algorithms).
        intermediate_analyzer = AnalyzeIntermediateUse(set(intermediate_finder.intermediates.keys()))
        model.accept(intermediate_analyzer)

        # Determine which intermediates to move and which to remove
        uses_intermediates: dict[Union[ir.Logical, ir.Break], set[ir.Logical]] = defaultdict(set)
        remove_declarations: set[ir.Logical] = set()
        for rel, decl in intermediate_finder.intermediates.items():
            # Only drop the original declaration if nothing outside an
            # algorithm still reads the intermediate.
            if rel not in intermediate_analyzer.used_outside_algorithm:
                remove_declarations.add(decl)
            # Regardless of removal, replicate the declaration before every
            # algorithm instruction that uses it.
            for instr in intermediate_analyzer.used_in_alg_instruction[rel]:
                uses_intermediates[instr].add(decl)

        # Rescope intermediates
        rescoper = IntermediateRescoper(uses_intermediates, remove_declarations)
        model = rescoper.walk(model)

        # Normalize Loopy updates
        normalizer = UpdateNormalizer()
        model = normalizer.walk(model)

        # Decompose recursive assignments
        decomposer = RecursiveAssignmentDecoupling()
        model = decomposer.walk(model)

        return model
|
|
117
|
+
|
|
118
|
+
class FindIntermediates(Visitor):
    """
    Gathers all `_nested_logical.*` intermediates defined in a Logical scope (where order
    doesn't matter); in particular DOES NOT gather any intermediates declared in the scope
    of a Sequence.
    """
    def __init__(self):
        # Maps each intermediate relation to the Logical that derives it.
        self.intermediates: dict[ir.Relation, ir.Logical] = dict()
        # NOTE(review): this flag is set/reset in visit_sequence but never read
        # in this visitor — confirm whether visit_logical was meant to consult
        # it to honor the "not in a Sequence" guarantee in the docstring.
        self._inside_algorithm: bool = False

    def visit_logical(self, node: ir.Logical, parent: Optional[ir.Node]):
        if is_logical_instruction(node):
            # An instruction deriving a `_nested_logical*` head is an
            # intermediate declaration; do not recurse into instructions.
            heads = get_instruction_head_rels(node)
            for rel in heads:
                if rel.name.startswith("_nested_logical"):
                    self.intermediates[rel] = node
        else:
            super().visit_logical(node, parent)

    def visit_sequence(self, node: ir.Sequence, parent: Optional[ir.Node]):
        if is_algorithm_script(node):
            self._inside_algorithm = True
        super().visit_sequence(node, parent)
        # NOTE(review): nested algorithm sequences would reset the flag on the
        # inner exit even while still inside the outer one — verify nesting
        # cannot occur, or track depth instead.
        if is_algorithm_script(node):
            self._inside_algorithm = False
|
|
143
|
+
|
|
144
|
+
|
|
145
|
+
class AnalyzeIntermediateUse(Visitor):
    """
    Identifies, for each nested logical intermediate, the algorithm instructions that
    use it. Additionally, determines whether the intermediate is used anywhere
    outside of an algorithm.
    """
    def __init__(self, intermediate_relations: set[ir.Relation]):
        # The set of candidate intermediate relations to track.
        self.intermediates = intermediate_relations
        # Intermediates referenced by at least one algorithm instruction.
        self.used_in_algorithm: set[ir.Relation] = set()
        # Per-intermediate: the algorithm instructions (Logical or Break) that use it.
        self.used_in_alg_instruction: dict[ir.Relation, set[Union[ir.Logical, ir.Break]]] = {rel: set() for rel in intermediate_relations}
        # Intermediates referenced from outside any algorithm script.
        self.used_outside_algorithm: set[ir.Relation] = set()

        # The algorithm Sequence currently being traversed, if any.
        self._current_algorithm: Optional[ir.Sequence] = None

    def register_use(self, instr: Union[ir.Logical, ir.Break], uses_intermediates: set[ir.Relation]):
        # this instruction uses intermediates
        if self._current_algorithm is not None:
            # instruction is inside an algorithm
            for rel in uses_intermediates:
                self.used_in_algorithm.add(rel)
                self.used_in_alg_instruction[rel].add(instr)
        else:
            self.used_outside_algorithm.update(uses_intermediates)

    def visit_break(self, node: ir.Break, parent: Optional[ir.Node]):
        # Break conditions can reference intermediates via Lookups.
        lookups = collect_by_type(ir.Lookup, node)
        lookup_rels = {lookup.relation for lookup in lookups}
        uses_intermediates = lookup_rels.intersection(self.intermediates)
        self.register_use(node, uses_intermediates)
        super().visit_break(node, parent)

    def visit_logical(self, node: ir.Logical, parent: Optional[ir.Node]):
        if is_logical_instruction(node):
            # Only body relations count as uses; heads are declarations.
            body = get_instruction_body_rels(node)
            uses_intermediates = body.intersection(self.intermediates)
            self.register_use(node, uses_intermediates)
        else:
            super().visit_logical(node, parent)

    def visit_sequence(self, node: ir.Sequence, parent: Optional[ir.Node]):
        if is_algorithm_script(node):
            self._current_algorithm = node
        super().visit_sequence(node, parent)
        # NOTE(review): as in FindIntermediates, exiting a nested algorithm
        # sequence would clear the outer context — confirm nesting is impossible.
        if is_algorithm_script(node):
            self._current_algorithm = None
|
|
190
|
+
|
|
191
|
+
class IntermediateRescoper(Rewriter):
    """
    Moves nested logical intermediates used in algorithm instructions from the logical scope
    to any algorithm using the instruction before every instruction that uses them. Removes
    an intermediate from the logical scope if it is not used anywhere else.

    * `uses_intermediates`: a mapping from algorithm instructions to the set of nested logical
      intermediates they use.
    * `remove_declarations`: the set of nested logical intermediates to remove from the
      logical scope because they are not used anywhere else.
    """
    def __init__(self,
                 uses_intermediates: dict[Union[ir.Logical, ir.Break], set[ir.Logical]],
                 remove_declarations: set[ir.Logical]):
        super().__init__()
        self.uses_intermediates = uses_intermediates
        self.remove_declarations = remove_declarations

    def handle_logical(self, node: ir.Logical, parent: ir.Node) -> ir.Logical:
        # Rebuild the body, dropping declarations scheduled for removal.
        # Membership tests rely on object identity/equality of the original
        # IR nodes collected by the analysis phase.
        body = []
        for child in node.body:
            if child in self.remove_declarations:
                continue
            child = self.walk(child, node)
            body.append(child)
        return node.reconstruct(node.engine, node.hoisted, tuple(body), node.annotations)

    def handle_sequence(self, node: ir.Sequence, parent: ir.Node) -> ir.Sequence:
        # Before each instruction that uses intermediates, insert a fresh
        # @assign of every intermediate it depends on.
        tasks = []
        for child in node.tasks:
            if child in self.uses_intermediates:
                assert isinstance(child, (ir.Logical, ir.Break))
                for intermediate in self.uses_intermediates[child]:
                    tasks.append(mk_assign(intermediate))
            child = self.walk(child, node)
            tasks.append(child)
        return node.reconstruct(node.engine, node.hoisted, tuple(tasks), node.annotations)
|
|
228
|
+
|
|
229
|
+
class UpdateNormalizer(Rewriter):
    """
    This pass normalizes Loopy Update operations (upsert, monoid, and monus) to use a single
    atom in their body. For any Update operation with more complex body, it introduces a new
    intermediate relation to hold the body results.
    """
    def __init__(self):
        super().__init__()
        # True while traversing inside an algorithm script Sequence.
        self._inside_algorithm: bool = False
        # Counter used to generate unique intermediate relation names.
        self._intermediate_counter: int = 0

    # Tests if the given Update operation requires normalization
    # * the body has more than one Lookup operation, or
    # * the body has other tasks than Lookup and Update
    def _requires_update_normalization(self, update: ir.Task) -> bool:
        if not isinstance(update, ir.Logical):
            return False
        if not is_update_instruction(update):
            return False
        _, lookups, others = split_instruction(update)
        return len(lookups) > 1 or len(others) > 0

    def handle_sequence(self, node: ir.Sequence, parent: ir.Node) -> ir.Sequence:
        if is_algorithm_script(node):
            self._inside_algorithm = True

        if self._inside_algorithm:
            # Replace each update needing normalization by the pair
            # (intermediate @assign, single-atom update); walk the rest.
            new_tasks = []
            for task in node.tasks:
                if self._requires_update_normalization(task):
                    assert isinstance(task, ir.Logical)
                    intermediate, normalized_update = self._normalize_update_instruction(task)
                    new_tasks.extend((intermediate, normalized_update))
                else:
                    new_tasks.append(self.walk(task, node))
            result = node.reconstruct(node.engine, node.hoisted, tuple(new_tasks), node.annotations)
        else:
            result = super().handle_sequence(node, parent)

        if is_algorithm_script(node):
            self._inside_algorithm = False

        return result

    def _normalize_update_instruction(self, update_instr: ir.Logical) -> tuple[ir.Logical, ir.Logical]:
        # Split the instruction into its Update, its Lookups, and anything else.
        update, lookups, others = split_instruction(update_instr)
        # NOTE(review): dead initializer — `normalized_update` is unconditionally
        # rebound below.
        normalized_update = []

        var_list = helpers.vars(update.args)

        # Fresh intermediate relation with one field per update argument.
        intermediate_rel = factory.relation(
            self._fresh_intermediate_name(), [
                factory.field(f"arg_{i}", var.type) for i, var in enumerate(var_list)
            ]
        )

        # 1) `assign intermediate(vars) = lookups, others` — holds the body result.
        intermediate_derive = factory.derive(intermediate_rel, var_list)
        intermediate_logical = mk_assign(factory.logical(
            engine=update_instr.engine,
            hoisted=update_instr.hoisted,
            body=(*lookups, *others, intermediate_derive),
            annos=list(update_instr.annotations)
        ))
        assert isinstance(intermediate_logical, ir.Logical)

        # 2) The original update, now reading from the single intermediate atom.
        intermediate_lookup = factory.lookup(
            intermediate_rel,
            var_list
        )

        normalized_update = factory.logical(
            engine=update_instr.engine,
            hoisted=update_instr.hoisted,
            body=(intermediate_lookup, update),
            annos=list(update_instr.annotations)
        )

        return (intermediate_logical, normalized_update)

    def _fresh_intermediate_name(self) -> str:
        self._intermediate_counter += 1
        return f"_loopy_update_intermediate_{self._intermediate_counter}"
|
|
311
|
+
|
|
312
|
+
class RecursiveAssignmentDecoupling(Rewriter):
    """
    Decouples assignments whose definition is "recursive", i.e., the body contain the head
    e.g., `assign iter = iter + 1`. Currently, BackIR analysis cannot handle properly such
    assignments. Such assignments are decoupled by introducing a new intermediate copy
    relation; in the example above, `assign iter_copy = iter; assign iter = iter_copy + 1`.
    The performance is not affected because the backend can identify the new assignment as a
    copy operation and the execution will not lead to materialization of the intermediate
    relation.
    """
    def __init__(self):
        super().__init__()
        # Counter used to generate unique copy-relation names.
        self._intermediate_copy_counter: int = 0
        # control of head_rel -> copy_rel substitution in traversal
        self._perform_substitution: bool = False
        self._head_rel: Optional[ir.Relation] = None
        self._copy_rel: Optional[ir.Relation] = None

    def _fresh_copy_rel_name(self, rel_name: str) -> str:
        self._intermediate_copy_counter += 1
        return f"_loopy_{rel_name}_copy_{self._intermediate_copy_counter}"

    def handle_sequence(self, node: ir.Sequence, parent: ir.Node) -> ir.Sequence:
        if is_script(node):
            # Expand each recursive assignment into (copy rule, rewritten rule).
            new_tasks = []
            for task in node.tasks:
                if self._is_recursive_assignment(task):
                    assert isinstance(task, ir.Logical)
                    intermediate_copy, decomposed_assign = self._decouple_recursive_assignment(task, parent)
                    new_tasks.extend((intermediate_copy, decomposed_assign))
                else:
                    new_tasks.append(self.walk(task, node))
            return node.reconstruct(node.engine, node.hoisted, tuple(new_tasks), node.annotations)
        else:
            return super().handle_sequence(node, parent)

    def _is_recursive_assignment(self, task: ir.Task) -> TypeGuard[ir.Logical]:
        # Recursive iff some relation appears both as a head and in the body.
        if is_logical_instruction(task):
            heads = get_instruction_head_rels(task)
            body = get_instruction_body_rels(task)
            return len(body & heads) > 0
        return False

    def _decouple_recursive_assignment(self, rule: ir.Logical, parent: ir.Node) -> tuple[ir.Logical, ir.Logical]:
        # we have `assign rel(x,...) = ..., rel(y,...), ...`
        update, _, _ = split_instruction(rule)
        self._head_rel = update.relation

        copy_rel_name = self._fresh_copy_rel_name(self._head_rel.name)

        self._copy_rel = factory.relation(copy_rel_name, list(self._head_rel.fields))
        # build `assign copy_rel(x,...) = rel(x,...)`
        copy_rule = cast(ir.Logical, mk_assign(
            factory.logical([
                factory.lookup(self._head_rel, update.args),
                factory.update(self._copy_rel, update.args, update.effect)
            ])
        ))

        # build `assign rel(x,...) = ..., copy_rel(y,...), ...``
        # The walk triggers handle_lookup below, which performs the
        # head_rel -> copy_rel substitution while the flag is set.
        self._perform_substitution = True
        rewritten_rule = self.walk(rule, parent)
        self._perform_substitution = False

        self._head_rel = None
        self._copy_rel = None

        return (copy_rule, rewritten_rule)

    def handle_lookup(self, node: ir.Lookup, parent: ir.Node) -> ir.Lookup:
        if self._perform_substitution and node.relation == self._head_rel:
            assert self._copy_rel is not None
            return factory.lookup(self._copy_rel, node.args)
        return super().handle_lookup(node, parent)
|
|
@@ -0,0 +1,70 @@
|
|
|
1
|
+
from v0.relationalai.semantics.metamodel.compiler import Pass
|
|
2
|
+
from v0.relationalai.semantics.metamodel import ir, builtins as rel_builtins, factory as f, visitor
|
|
3
|
+
from v0.relationalai.semantics.metamodel.typer import typer
|
|
4
|
+
|
|
5
|
+
from typing import List, Sequence, Tuple, Union
|
|
6
|
+
|
|
7
|
+
# Rewrite constants to vars in Updates. This results in a more normalized format where
# updates contain only variables. This allows for easier rewrites in later passes.
class ConstantsToVars(Pass):
    def rewrite(self, model: ir.Model, options: dict = {}) -> ir.Model:
        r = self.ConstantToVarRewriter()
        return r.walk(model)

    # Return 1) a new list of Values where every scalar constant is replaced by
    # a fresh Var and 2) equality lookups binding each new Var to its original
    # constant value.
    @staticmethod
    def replace_constants_with_vars(vals: Sequence[ir.Value]) -> Tuple[List[ir.Value], List[ir.Lookup]]:
        new_vals = []
        eqs = []

        for i, val in enumerate(vals):
            if isinstance(val, ir.PyValue) or isinstance(val, ir.Literal):
                # Replace constant with a new Var.
                typ = typer.to_type(val)
                assert isinstance(typ, ir.ScalarType), "can only replace scalar constants with vars"
                new_var = ir.Var(typ, f"{typ.name.lower()}_{i}")
                new_vals.append(new_var)
                # Bind the fresh var to the original constant: new_var = val.
                eqs.append(f.lookup(rel_builtins.eq, [new_var, val]))
            else:
                new_vals.append(val)

        return new_vals, eqs

    # Returns the rewritten update (constants replaced by vars) preceded by the
    # equality lookups required to bind the new vars.
    @staticmethod
    def dedup_update(update: ir.Update) -> List[Union[ir.Update, ir.Lookup]]:
        deduped_vals, req_lookups = ConstantsToVars.replace_constants_with_vars(update.args)
        new_update = ir.Update(
            update.engine,
            update.relation,
            tuple(deduped_vals),
            update.effect,
            update.annotations,
        )
        return req_lookups + [new_update]

    # Does the actual work.
    class ConstantToVarRewriter(visitor.Rewriter):
        def __init__(self):
            super().__init__()

        # We implement handle_logical instead of handle_update because in
        # addition to modifying said update we require new lookups (equality
        # between original and deduplicated variables).
        def handle_logical(self, node: ir.Logical, parent: ir.Node):
            # In order to recurse over subtasks.
            node = super().handle_logical(node, parent)

            new_body = []
            for subtask in node.body:
                if isinstance(subtask, ir.Update):
                    new_body.extend(ConstantsToVars.dedup_update(subtask))
                else:
                    new_body.append(subtask)

            return ir.Logical(
                node.engine,
                node.hoisted,
                tuple(new_body),
                node.annotations
            )
|
|
@@ -0,0 +1,104 @@
|
|
|
1
|
+
from v0.relationalai.semantics.metamodel.compiler import Pass
|
|
2
|
+
from v0.relationalai.semantics.metamodel import ir, builtins as rel_builtins, factory as f, visitor
|
|
3
|
+
from v0.relationalai.semantics.metamodel import helpers
|
|
4
|
+
from v0.relationalai.semantics.metamodel.util import FrozenOrderedSet
|
|
5
|
+
|
|
6
|
+
from v0.relationalai.semantics.lqp.utils import output_names
|
|
7
|
+
|
|
8
|
+
from typing import List, Sequence, Tuple, Union
|
|
9
|
+
|
|
10
|
+
# Deduplicate Vars in Updates and Outputs.
class DeduplicateVars(Pass):
    def rewrite(self, model: ir.Model, options: dict = {}) -> ir.Model:
        r = self.VarDeduplicator()
        return r.walk(model)

    # Return 1) a new list of Values with no duplicates (at the object level) and
    # 2) equalities between any original Value and a deduplicated Value.
    @staticmethod
    def dedup_values(vals: Sequence[ir.Value]) -> Tuple[List[ir.Value], List[ir.Lookup]]:
        # If a var is seen more than once, it is a duplicate and we will create
        # a new Var and equate it with the seen one.
        seen_vars = set()

        new_vals = []
        eqs = []

        for i, val in enumerate(vals):
            # Duplicates can only occur within Vars.
            # TODO: we don't know for sure if these are the only relevant cases.
            if isinstance(val, ir.Default) or isinstance(val, ir.Var):
                var = val if isinstance(val, ir.Var) else val.var
                if var in seen_vars:
                    # Fresh var named after the original, suffixed by position.
                    new_var = ir.Var(var.type, var.name + "_dup_" + str(i))
                    # Preserve the Default wrapper when the original had one.
                    new_val = new_var if isinstance(val, ir.Var) else ir.Default(new_var, val.value)
                    new_vals.append(new_val)
                    eqs.append(f.lookup(rel_builtins.eq, [new_var, var]))
                else:
                    seen_vars.add(var)
                    new_vals.append(val)
            else:
                # No possibility of problematic duplication.
                new_vals.append(val)

        return new_vals, eqs

    # Returns a reconstructed output with no duplicate variable objects
    # (dedup_values) and now necessary equalities between any two previously
    # duplicate variables.
    @staticmethod
    def dedup_output(output: ir.Output) -> List[Union[ir.Output, ir.Lookup]]:
        vals = helpers.output_values(output.aliases)
        deduped_vals, req_lookups = DeduplicateVars.dedup_values(vals)
        # Need the names so we can recombine.
        alias_names = output_names(output.aliases)
        new_output = ir.Output(
            output.engine,
            FrozenOrderedSet(list(zip(alias_names, deduped_vals))),
            output.keys,
            output.annotations,
        )
        return req_lookups + [new_output]

    # Returns a replacement update with no duplicate variable objects
    # (dedup_values) and now necessary equalities between any two previously
    # duplicate variables.
    @staticmethod
    def dedup_update(update: ir.Update) -> List[Union[ir.Update, ir.Lookup]]:
        deduped_vals, req_lookups = DeduplicateVars.dedup_values(update.args)
        new_update = ir.Update(
            update.engine,
            update.relation,
            tuple(deduped_vals),
            update.effect,
            update.annotations,
        )
        return req_lookups + [new_update]

    # Does the actual work.
    class VarDeduplicator(visitor.Rewriter):
        def __init__(self):
            super().__init__()

        # We implement handle_logical instead of handle_update/handle_output
        # because in addition to modifying said update/output we require new
        # lookups (equality between original and deduplicated variables).
        def handle_logical(self, node: ir.Logical, parent: ir.Node):
            # In order to recurse over subtasks.
            node = super().handle_logical(node, parent)

            new_body = []
            for subtask in node.body:
                if isinstance(subtask, ir.Output):
                    new_body.extend(DeduplicateVars.dedup_output(subtask))
                elif isinstance(subtask, ir.Update):
                    new_body.extend(DeduplicateVars.dedup_update(subtask))
                else:
                    new_body.append(subtask)

            return ir.Logical(
                node.engine,
                node.hoisted,
                tuple(new_body),
                node.annotations
            )
|