PyPI - compiled-knowledge - Versions diffs - 4.0.0a16__cp312-cp312-win_amd64.whl → 4.0.0a18__cp312-cp312-win_amd64.whl - Mend

compiled-knowledge 4.0.0a16__cp312-cp312-win_amd64.whl → 4.0.0a18__cp312-cp312-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of compiled-knowledge might be problematic. Click here for more details.

Files changed (36) hide show

ck/circuit_compiler/cython_vm_compiler/_compiler.pyx CHANGED Viewed

@@ -1,17 +1,15 @@
 from __future__ import annotations
-from pickletools import long1
-from typing import Sequence, Dict, List, Tuple, Set, Optional, Iterator
+from typing import Dict, Tuple, Sequence
 import numpy as np
 import ctypes as ct
 from ck import circuit
-from ck.circuit import CircuitNode, ConstNode, VarNode, OpNode, ADD, Circuit
+from ck.circuit import OpNode, VarNode, CircuitNode
 from ck.circuit_compiler.support.circuit_analyser import CircuitAnalysis, analyze_circuit
-from ck.circuit_compiler.support.input_vars import infer_input_vars, InputVars
-from ck.program.raw_program import RawProgram, RawProgramFunction
-from ck.utils.np_extras import DType, NDArrayNumeric, NDArray, DTypeNumeric
+from ck.program.raw_program import RawProgramFunction
+from ck.utils.np_extras import NDArrayNumeric, DTypeNumeric
 from cpython.mem cimport PyMem_Malloc, PyMem_Realloc, PyMem_Free
@@ -63,21 +61,21 @@ def make_function(
 # VM instructions
-ADD = circuit.ADD
-MUL = circuit.MUL
-COPY: int = max(ADD, MUL) + 1
+cdef int ADD = circuit.ADD
+cdef int MUL = circuit.MUL
+cdef int COPY = max(ADD, MUL) + 1
 # VM arrays
-VARS: int = 0
-TMPS: int = 1
-CONSTS: int = 2
-RESULT: int = 3
+cdef int VARS = 0
+cdef int TMPS = 1
+cdef int CONSTS = 2
+cdef int RESULT = 3
-def _make_instructions_from_analysis(
-        analysis: CircuitAnalysis,
-        dtype: DTypeNumeric,
-) -> Tuple[Instructions, NDArrayNumeric]:
+cdef tuple[Instructions, cnp.ndarray] _make_instructions_from_analysis(
+        object analysis: CircuitAnalysis,
+        object dtype: DTypeNumeric,
+): # -> Tuple[Instructions, NDArrayNumeric]:
     if dtype != np.float64:
         raise RuntimeError(f'only DType {np.float64} currently supported')
@@ -91,7 +89,7 @@ def _make_instructions_from_analysis(
         np_consts[i] = node.value
     # Where to get input values for each possible node.
-    node_to_element: Dict[int, ElementID] = {}
+    cdef dict[int, ElementID] node_to_element  = {}
     # const nodes
     for node_id, const_idx in node_to_const_idx.items():
         node_to_element[node_id] = ElementID(CONSTS, const_idx)
@@ -110,21 +108,16 @@ def _make_instructions_from_analysis(
     # Build instructions
     instructions: Instructions = Instructions()
-    op_node: OpNode
+    cdef object op_node
     for op_node in analysis.op_nodes:
-        dest: ElementID = node_to_element[id(op_node)]
-        args: list[ElementID] = [
-            node_to_element[id(arg)]
-            for arg in op_node.args
-        ]
-        instructions.append(op_node.symbol, args, dest)
+        instructions.append_op(op_node.symbol, op_node, node_to_element)
     # Add any copy operations, i.e., result nodes that are not op nodes
     for i, node in enumerate(analysis.result_nodes):
         if not isinstance(node, OpNode):
             dest: ElementID = ElementID(RESULT, i)
-            args: list[ElementID] = [node_to_element[id(node)]]
-            instructions.append(COPY, args, dest)
+            src: ElementID = node_to_element[id(node)]
+            instructions.append_copy(src, dest)
     return instructions, np_consts
@@ -136,39 +129,70 @@ cdef struct ElementID:
 cdef struct Instruction:
     int             symbol  # ADD, MUL, COPY
-    int             num_args
+    Py_ssize_t      num_args
     ElementID*      args
     ElementID       dest
 cdef class Instructions:
     cdef Instruction* instructions
+    cdef int allocated
     cdef int num_instructions
-    def __init__(self):
-        self.instructions = <Instruction*> PyMem_Malloc(0)
+    def __init__(self) -> None:
         self.num_instructions = 0
+        self.allocated = 64
+        self.instructions = <Instruction*> PyMem_Malloc(self.allocated * sizeof(Instruction))
+    cdef void append_copy(
+            self,
+            ElementID src,
+            ElementID dest,
+    ) except*:
+        c_args = <ElementID*> PyMem_Malloc(sizeof(ElementID))
+        if not c_args:
+            raise MemoryError()
-    def append(self, int symbol, list[ElementID] args, ElementID dest) -> None:
-        cdef int num_args = len(args)
-        cdef int i
+        c_args[0] = src
+        self._append(COPY, 1, c_args, dest)
+    cdef void append_op(self, int symbol, object op_node: OpNode, dict[int, ElementID] node_to_element) except*:
+        args = op_node.args
+        cdef Py_ssize_t num_args = len(args)
-        c_args = <ElementID*> PyMem_Malloc(
-            num_args * sizeof(ElementID))
+        # Create the instruction arguments array
+        c_args = <ElementID*> PyMem_Malloc(num_args * sizeof(ElementID))
         if not c_args:
             raise MemoryError()
-        for i in range(num_args):
-            c_args[i] = args[i]
+        cdef Py_ssize_t i = num_args
+        while i > 0:
+            i -= 1
+            c_args[i] = node_to_element[id(args[i])]
+        dest: ElementID = node_to_element[id(op_node)]
+        self._append(symbol, num_args, c_args, dest)
+    cdef void _append(self, int symbol, Py_ssize_t num_args, ElementID* c_args, ElementID dest) except *:
+        cdef int i
         cdef int num_instructions = self.num_instructions
-        self.instructions = <Instruction*> PyMem_Realloc(
-            self.instructions,
-            sizeof(Instruction) * (num_instructions + 1)
-        )
-        if not self.instructions:
-            raise MemoryError()
+        # Ensure sufficient instruction memory
+        cdef int allocated = self.allocated
+        if num_instructions == allocated:
+            allocated *= 2
+            self.instructions = <Instruction*> PyMem_Realloc(
+                self.instructions,
+                allocated * sizeof(Instruction),
+            )
+            if not self.instructions:
+                raise MemoryError()
+            self.allocated = allocated
+        # Add the instruction
         self.instructions[num_instructions] = Instruction(
             symbol,
             num_args,
@@ -177,7 +201,7 @@ cdef class Instructions:
         )
         self.num_instructions = num_instructions + 1
-    def __dealloc__(self):
+    def __dealloc__(self) -> None:
         cdef Instruction* instructions = self.instructions
         if instructions:
             for i in range(self.num_instructions):
@@ -194,15 +218,16 @@ cdef void cvm_float64(
     double* consts,
     double* result,
     Instructions instructions,
-):
-    # Core virtual machine.
+) except *:
+    # Core virtual machine (for dtype float64).
-    cdef int i, num_args, symbol
+    cdef int symbol
+    cdef Py_ssize_t i
     cdef double accumulator
     cdef ElementID* args
-    cdef ElementID elem
+    cdef ElementID  elem
-    # index the four arrays by constants VARS, TMPS, CONSTS, and RESULT
+    # Index the four arrays by constants VARS, TMPS, CONSTS, and RESULT
     cdef (double*) arrays[4]
     arrays[VARS] = vars_in
     arrays[TMPS] = tmps
@@ -210,29 +235,32 @@ cdef void cvm_float64(
     arrays[RESULT] = result
     cdef Instruction* instruction_ptr = instructions.instructions
-    for _ in range(instructions.num_instructions):
+    cdef int num_instructions = instructions.num_instructions
-        symbol = instruction_ptr[0].symbol
-        args = instruction_ptr[0].args
-        num_args = instruction_ptr[0].num_args
+    while num_instructions > 0:
+        num_instructions -= 1
+        symbol = instruction_ptr.symbol
+        args = instruction_ptr.args
         elem = args[0]
         accumulator = arrays[elem.array][elem.index]
         if symbol == ADD:
-            for i in range(1, num_args):
+            i = instruction_ptr.num_args
+            while i > 1:
+                i -= 1
                 elem = args[i]
                 accumulator += arrays[elem.array][elem.index]
         elif symbol == MUL:
-            for i in range(1, num_args):
+            i = instruction_ptr.num_args
+            while i > 1:
+                i -= 1
                 elem = args[i]
                 accumulator *= arrays[elem.array][elem.index]
-        elif symbol == COPY:
-            pass
-        else:
-            raise RuntimeError('symbol not understood: ' + str(symbol))
+        # else symbol == COPY, nothing to do
-        elem = instruction_ptr[0].dest
+        elem = instruction_ptr.dest
         arrays[elem.array][elem.index] = accumulator
         # Advance the instruction pointer

ck/circuit_compiler/named_circuit_compilers.py CHANGED Viewed

@@ -54,4 +54,4 @@ class NamedCircuitCompiler(Enum):
         return self.value[0]
-DEFAULT_CIRCUIT_COMPILER: NamedCircuitCompiler = NamedCircuitCompiler.LLVM_VM
+DEFAULT_CIRCUIT_COMPILER: NamedCircuitCompiler = NamedCircuitCompiler.CYTHON_VM

ck/pgm_compiler/factor_elimination.py CHANGED Viewed

@@ -149,7 +149,7 @@ def join_tree_to_circuit(
         limit_product_tree_search,
     )
     top: CircuitNode = top_table.top()
-    top_table.circuit.remove_unreachable_op_nodes(top)
+    top.circuit.remove_unreachable_op_nodes(top)
     return PGMCircuit(
         rvs=tuple(pgm.rvs),
@@ -169,27 +169,37 @@ def _circuit_tables_from_join_tree(
 ) -> CircuitTable:
     """
     This is a basic algorithm for constructing a circuit table from a join tree.
+    Algorithm synopsis:
+    1) Get a CircuitTable for each factor allocated to this join tree node, and
+       for each child of the join tree node (recursive call to _circuit_tables_from_join_tree).
+    2) Form a binary tree of the collected circuit tables.
+    3) Perform table products and sum-outs for each node in the binary tree, which should
+       leave a single circuit table with a single row.
     """
-    # The PGM factors allocated to this join tree node
-    factors: List[CircuitTable] = [
-        factor_tables.get_table(factor)
-        for factor in join_tree.factors
-    ]
-    # The children of this join tree node
-    factors.extend(
-        _circuit_tables_from_join_tree(factor_tables, child, limit_product_tree_search)
-        for child in join_tree.children
+    # Get all the factors to combine.
+    factors: List[CircuitTable] = list(
+        chain(
+            (
+                # The PGM factors allocated to this join tree node
+                factor_tables.get_table(factor)
+                for factor in join_tree.factors
+            ),
+            (
+                # The children of this join tree node
+                _circuit_tables_from_join_tree(factor_tables, child, limit_product_tree_search)
+                for child in join_tree.children
+            ),
+        )
     )
     # The usual join tree approach just forms the product of all the tables in `factors`.
     # The tree width is not affected by the order of products, however some orders
     # lead to smaller numbers of arithmetic operations.
     #
-    # If `options.optimise_products` is true, then heuristics are used
+    # If `limit_product_tree_search > 1`, then heuristics are used to
     # reduce the number of arithmetic operations.
-    # Deal with the special case: no factors
+    # Deal with the special case: zero factors
     if len(factors) == 0:
         circuit = factor_tables.circuit
         if len(join_tree.separator) == 0:

ck/pgm_compiler/support/circuit_table/__init__.py CHANGED Viewed

@@ -1,5 +1,12 @@
-# from .circuit_table_py import (
-from .circuit_table import (
+# Two implementations of the `circuit_table` module are provided
+# for developer R&D purposes. One is pure Python and the other is Cython.
+# Which implementation is used can be selected here.
+# A similar selection can be made for the `circuit` module.
+# Note that if the Cython implementation is chosen for `circuit_table` then
+# the Cython implementation must be chosen for `circuit`.
+# from ._circuit_table_py import (
+from ._circuit_table_cy import (
     CircuitTable,
     TableInstance,
     sum_out,

ck/pgm_compiler/support/circuit_table/_circuit_table_cy.cp312-win_amd64.pyd ADDED Viewed

Binary file

ck/pgm_compiler/support/circuit_table/_circuit_table_cy.pyx ADDED Viewed

@@ -0,0 +1,332 @@
+from __future__ import annotations
+from typing import Sequence, Tuple, Iterable
+from ck.circuit import MUL, ADD
+from ck.circuit._circuit_cy cimport Circuit, CircuitNode
+cdef int c_ADD = ADD
+cdef int c_MUL = MUL
+TableInstance = Tuple[int, ...]
+cdef class CircuitTable:
+    """
+    A circuit table manages a set of CircuitNodes, where each node corresponds
+    to an instance for a set of (zero or more) random variables.
+    Operations on circuit tables typically add circuit nodes to the circuit. It will
+    heuristically avoid adding unnecessary nodes (e.g. addition of zero, multiplication
+    by zero or one.) However, it may be that interim circuit nodes are created that
+    end up not being used. Consider calling `Circuit.remove_unreachable_op_nodes` after
+    completing all circuit table operations.
+    It is generally expected that no CircuitTable row will be created with a constant
+    zero node. These are assumed to be optimised out already.
+    """
+    cdef public Circuit circuit
+    cdef public tuple[int, ...] rv_idxs
+    cdef dict[tuple[int, ...], CircuitNode] rows
+    def __init__(
+            self,
+            circuit: Circuit,
+            rv_idxs: Sequence[int],
+            rows: Iterable[Tuple[TableInstance, CircuitNode]] = (),
+    ):
+        """
+        Args:
+            circuit: the circuit whose nodes are being managed by this table.
+            rv_idxs: indexes of random variables.
+            rows: optional rows to add to the table.
+        Assumes:
+            * rv_idxs contains no duplicates.
+            * all row instances conform to the indexed random variables.
+            * all row circuit nodes belong to the given circuit.
+        """
+        self.circuit = circuit
+        self.rv_idxs = tuple(rv_idxs)
+        self.rows = dict(rows)
+    def __len__(self) -> int:
+        return len(self.rows)
+    def get(self, key, default=None):
+        return self.rows.get(key, default)
+    def keys(self) -> Iterable[CircuitNode]:
+        return self.rows.keys()
+    def values(self) -> Iterable[tuple[int, ...]]:
+        return self.rows.values()
+    def __getitem__(self, key):
+        return self.rows[key]
+    def __setitem__(self, key, value):
+        self.rows[key] = value
+    cpdef CircuitNode top(self):
+        # Get the circuit top value.
+        #
+        # Raises:
+        #     RuntimeError if there is more than one row in the table.
+        #
+        # Returns:
+        #     A single circuit node.
+        cdef int number_of_rows = len(self.rows)
+        if number_of_rows == 0:
+            return self.circuit.zero
+        elif number_of_rows == 1:
+            return next(iter(self.rows.values()))
+        else:
+            raise RuntimeError('cannot get top node from a table with more that 1 row')
+# ==================================================================================
+#  Circuit Table Operations
+# ==================================================================================
+cpdef CircuitTable sum_out(CircuitTable table, object rv_idxs: Iterable[int]):
+    # Return a circuit table that results from summing out
+    # the given random variables of this circuit table.
+    #
+    # Normally this will return a new table. However, if rv_idxs is empty,
+    # then the given table is returned unmodified.
+    #
+    # Raises:
+    #     ValueError if rv_idxs is not a subset of table.rv_idxs.
+    #     ValueError if rv_idxs contains duplicates.
+    cdef tuple[int, ...] rv_idxs_seq = tuple(rv_idxs)
+    if len(rv_idxs_seq) == 0:
+        # nothing to do
+        return table
+    cdef set[int] rv_idxs_set = set(rv_idxs_seq)
+    if len(rv_idxs_set) != len(rv_idxs_seq):
+        raise ValueError('rv_idxs contains duplicates')
+    if not rv_idxs_set.issubset(table.rv_idxs):
+        raise ValueError('rv_idxs is not a subset of table.rv_idxs')
+    cdef int rv_index
+    cdef list[int] remaining_rv_idxs = []
+    for rv_index in table.rv_idxs:
+        if rv_index not in rv_idxs_set:
+            remaining_rv_idxs.append(rv_index)
+    cdef int num_remaining = len(remaining_rv_idxs)
+    if num_remaining == 0:
+        # Special case: summing out all random variables
+        return sum_out_all(table)
+    # index_map[i] is the location in table.rv_idxs for remaining_rv_idxs[i]
+    cdef list[int] index_map = []
+    for rv_index in remaining_rv_idxs:
+        index_map.append(_find(table.rv_idxs, rv_index))
+    cdef dict[tuple[int, ...], list[CircuitNode]] groups = {}
+    cdef object got
+    cdef list[int] group_instance
+    cdef tuple[int, ...] group_instance_tuple
+    cdef int i
+    cdef CircuitNode node
+    cdef tuple[int, ...] instance
+    for instance, node in table.rows.items():
+        group_instance = []
+        for i in index_map:
+            group_instance.append(instance[i])
+        group_instance_tuple = tuple(group_instance)
+        got = groups.get(group_instance_tuple)
+        if got is None:
+            groups[group_instance_tuple] = [node]
+        else:
+            got.append(node)
+    cdef Circuit circuit = table.circuit
+    cdef CircuitTable new_table = CircuitTable(circuit, remaining_rv_idxs)
+    cdef dict[tuple[int, ...], CircuitNode] rows = new_table.rows
+    for group_instance_tuple, to_add in groups.items():
+        node = circuit.op(c_ADD, tuple(to_add))
+        if not node.is_zero:
+            rows[group_instance_tuple] = node
+    return new_table
+cpdef CircuitTable sum_out_all(CircuitTable table):
+    # Return a circuit table that results from summing out
+    # all random variables of this circuit table.
+    circuit: Circuit = table.circuit
+    num_rows: int = len(table)
+    if num_rows == 0:
+        return CircuitTable(circuit, ())
+    elif num_rows == 1:
+        node = next(iter(table.rows.values()))
+    else:
+        node: CircuitNode = circuit.op(c_ADD, tuple(table.rows.values()))
+        if node.is_zero:
+            return CircuitTable(circuit, ())
+    return CircuitTable(circuit, (), [((), node)])
+cpdef CircuitTable project(CircuitTable table: CircuitTable, object rv_idxs: Iterable[int]):
+    # Call `sum_out(table, to_sum_out)`, where
+    # `to_sum_out = table.rv_idxs - rv_idxs`.
+    cdef set[int] to_sum_out = set(table.rv_idxs)
+    to_sum_out.difference_update(rv_idxs)
+    return sum_out(table, to_sum_out)
+cpdef CircuitTable product(CircuitTable x, CircuitTable y):
+    # Return a circuit table that results from the product of the two given tables.
+    #
+    # If x or y equals `one_table`, then the other table is returned. Otherwise,
+    # a new circuit table will be constructed and returned.
+    cdef int i
+    cdef Circuit circuit = x.circuit
+    if y.circuit is not circuit:
+        raise ValueError('circuit tables must refer to the same circuit')
+    # Make the smaller table 'y', and the other 'x'.
+    # This is to minimise the index size on 'y'.
+    if len(x) < len(y):
+        x, y = y, x
+    # Special case: y == 0 or 1, and has no random variables.
+    if len(y.rv_idxs) == 0:
+        if len(y) == 1 and y.top().is_one:
+            return x
+        elif len(y) == 0:
+            return CircuitTable(circuit, x.rv_idxs)
+    # Set operations on rv indexes. After these operations:
+    # * co_rv_idxs is the set of rv indexes common (co) to x and y,
+    # * yo_rv_idxs is the set of rv indexes in y only (yo), and not in x.
+    cdef set[int] yo_rv_idxs_set = set(y.rv_idxs)
+    cdef set[int] co_rv_idxs_set = set(x.rv_idxs)
+    co_rv_idxs_set.intersection_update(yo_rv_idxs_set)
+    yo_rv_idxs_set.difference_update(co_rv_idxs_set)
+    if len(co_rv_idxs_set) == 0:
+        # Special case: no common random variables.
+        return _product_no_common_rvs(x, y)
+    # Convert random variable index sets to sequences
+    cdef tuple[int, ...] yo_rv_idxs = tuple(yo_rv_idxs_set)  # y only random variables
+    cdef tuple[int, ...] co_rv_idxs = tuple(co_rv_idxs_set)  # common random variables
+    # Cache mappings from result Instance to index into source Instance (x or y).
+    # This will be used in indexing and product loops to pull our needed values
+    # from the source instances.
+    cdef list[int] co_from_x_map = []
+    cdef list[int] co_from_y_map = []
+    cdef list[int] yo_from_y_map = []
+    for rv_index in co_rv_idxs:
+        co_from_x_map.append(_find(x.rv_idxs, rv_index))
+        co_from_y_map.append(_find(y.rv_idxs, rv_index))
+    for rv_index in yo_rv_idxs:
+        yo_from_y_map.append(_find(y.rv_idxs, rv_index))
+    cdef list[int] co
+    cdef list[int] yo
+    cdef object got
+    cdef tuple[int, ...] co_tuple
+    cdef tuple[int, ...] yo_tuple
+    cdef CircuitTable table = CircuitTable(circuit, x.rv_idxs + yo_rv_idxs)
+    cdef dict[tuple[int, ...], CircuitNode] rows = table.rows
+    # Index the y rows by common-only key (y is the smaller of the two tables).
+    cdef dict[tuple[int, ...], list[tuple[tuple[int, ...], CircuitNode]]] y_index = {}
+    for y_instance, y_node in y.rows.items():
+        co = []
+        yo = []
+        for i in co_from_y_map:
+            co.append(y_instance[i])
+        for i in yo_from_y_map:
+            yo.append(y_instance[i])
+        co_tuple = tuple(co)
+        yo_tuple = tuple(yo)
+        got = y_index.get(co_tuple)
+        if got is None:
+            y_index[co_tuple] = [(yo_tuple, y_node)]
+        else:
+            got.append((yo_tuple, y_node))
+    # Iterate over x rows, inserting (instance, value).
+    # Rows with constant node values of one are optimised out.
+    for x_instance, x_node in x.rows.items():
+        co = []
+        for i in co_from_x_map:
+            co.append(x_instance[i])
+        co_tuple = tuple(co)
+        if x_node.is_one:
+            # Multiplying by one.
+            # Iterate over matching y rows.
+            got = y_index.get(co_tuple)
+            if got is not None:
+                for yo_tuple, y_node in got:
+                    rows[x_instance + yo_tuple] = y_node
+        else:
+            # Iterate over matching y rows.
+            got = y_index.get(co_tuple)
+            if got is not None:
+                for yo_tuple, y_node in got:
+                    if y_node.is_one:
+                        rows[x_instance + yo_tuple] = x_node
+                    else:
+                        rows[x_instance + yo_tuple] = circuit.op(c_MUL, (x_node, y_node))
+    return table
+cdef int _find(tuple[int, ...] xs, int x):
+    cdef int i
+    for i in range(len(xs)):
+        if xs[i] == x:
+            return i
+    # Very unexpected
+    raise RuntimeError('not found')
+cdef CircuitTable _product_no_common_rvs(CircuitTable x, CircuitTable y):
+    # Return the product of x and y, where x and y have no common random variables.
+    #
+    # This is an optimisation of the more general product algorithm, as no index needs
+    # to be constructed based on the common random variables.
+    #
+    # Rows with constant node values of one are optimised out.
+    #
+    # Assumes:
+    #     * There are no common random variables between x and y.
+    #     * x and y are for the same circuit.
+    cdef Circuit circuit = x.circuit
+    cdef CircuitTable table = CircuitTable(circuit, x.rv_idxs + y.rv_idxs)
+    cdef tuple[int, ...] instance
+    for x_instance, x_node in x.rows.items():
+        if x_node.is_one:
+            for y_instance, y_node in y.rows.items():
+                instance = x_instance + y_instance
+                table.rows[instance] = y_node
+        else:
+            for y_instance, y_node in y.rows.items():
+                instance = x_instance + y_instance
+                if y_node.is_one:
+                    table.rows[instance] = x_node
+                else:
+                    table.rows[instance] = circuit.op(c_MUL, (x_node, y_node))
+    return table