PyPI - mplang-nightly - Versions diffs - 0.1.dev158__py3-none-any.whl → 0.1.dev268__py3-none-any.whl - Mend

mplang-nightly 0.1.dev158py3-none-any.whl → 0.1.dev268py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (191) hide show

mplang/__init__.py +21 -45
mplang/py.typed +13 -0
mplang/v1/__init__.py +157 -0
mplang/v1/_device.py +602 -0
mplang/{analysis → v1/analysis}/__init__.py +1 -1
mplang/{analysis → v1/analysis}/diagram.py +5 -7
mplang/v1/core/__init__.py +157 -0
mplang/{core → v1/core}/cluster.py +30 -14
mplang/{core → v1/core}/comm.py +5 -1
mplang/{core → v1/core}/context_mgr.py +1 -1
mplang/{core/dtype.py → v1/core/dtypes.py} +44 -2
mplang/{core → v1/core}/expr/__init__.py +7 -7
mplang/{core → v1/core}/expr/ast.py +13 -14
mplang/{core → v1/core}/expr/evaluator.py +65 -24
mplang/{core → v1/core}/expr/printer.py +24 -18
mplang/{core → v1/core}/expr/transformer.py +3 -3
mplang/{core → v1/core}/expr/utils.py +2 -2
mplang/{core → v1/core}/expr/visitor.py +1 -1
mplang/{core → v1/core}/expr/walk.py +1 -1
mplang/{core → v1/core}/interp.py +6 -6
mplang/{core → v1/core}/mpir.py +23 -16
mplang/{core → v1/core}/mpobject.py +6 -6
mplang/{core → v1/core}/mptype.py +13 -10
mplang/{core → v1/core}/pfunc.py +4 -4
mplang/{core → v1/core}/primitive.py +106 -201
mplang/{core → v1/core}/table.py +36 -8
mplang/{core → v1/core}/tensor.py +1 -1
mplang/{core → v1/core}/tracer.py +9 -9
mplang/{api.py → v1/host.py} +38 -6
mplang/v1/kernels/__init__.py +41 -0
mplang/{kernels → v1/kernels}/base.py +1 -1
mplang/v1/kernels/basic.py +240 -0
mplang/{kernels → v1/kernels}/context.py +42 -27
mplang/{kernels → v1/kernels}/crypto.py +44 -37
mplang/v1/kernels/fhe.py +858 -0
mplang/{kernels → v1/kernels}/mock_tee.py +12 -13
mplang/{kernels → v1/kernels}/phe.py +263 -57
mplang/{kernels → v1/kernels}/spu.py +137 -48
mplang/{kernels → v1/kernels}/sql_duckdb.py +12 -15
mplang/{kernels → v1/kernels}/stablehlo.py +30 -23
mplang/v1/kernels/value.py +626 -0
mplang/{ops → v1/ops}/__init__.py +5 -16
mplang/{ops → v1/ops}/base.py +2 -5
mplang/{ops/builtin.py → v1/ops/basic.py} +34 -26
mplang/v1/ops/crypto.py +262 -0
mplang/v1/ops/fhe.py +272 -0
mplang/{ops → v1/ops}/jax_cc.py +33 -68
mplang/v1/ops/nnx_cc.py +168 -0
mplang/{ops → v1/ops}/phe.py +16 -4
mplang/{ops → v1/ops}/spu.py +3 -5
mplang/v1/ops/sql_cc.py +303 -0
mplang/{ops → v1/ops}/tee.py +9 -24
mplang/{protos → v1/protos}/v1alpha1/mpir_pb2.pyi +71 -21
mplang/v1/protos/v1alpha1/value_pb2.py +34 -0
mplang/v1/protos/v1alpha1/value_pb2.pyi +169 -0
mplang/{runtime → v1/runtime}/__init__.py +2 -2
mplang/v1/runtime/channel.py +230 -0
mplang/{runtime → v1/runtime}/cli.py +35 -20
mplang/{runtime → v1/runtime}/client.py +19 -8
mplang/{runtime → v1/runtime}/communicator.py +59 -15
mplang/{runtime → v1/runtime}/data_providers.py +80 -19
mplang/{runtime → v1/runtime}/driver.py +30 -12
mplang/v1/runtime/link_comm.py +196 -0
mplang/{runtime → v1/runtime}/server.py +58 -42
mplang/{runtime → v1/runtime}/session.py +57 -71
mplang/{runtime → v1/runtime}/simulation.py +55 -28
mplang/v1/simp/api.py +353 -0
mplang/{simp → v1/simp}/mpi.py +8 -9
mplang/{simp/__init__.py → v1/simp/party.py} +19 -145
mplang/{simp → v1/simp}/random.py +21 -22
mplang/v1/simp/smpc.py +238 -0
mplang/v1/utils/table_utils.py +185 -0
mplang/v2/__init__.py +424 -0
mplang/v2/backends/__init__.py +57 -0
mplang/v2/backends/bfv_impl.py +705 -0
mplang/v2/backends/channel.py +217 -0
mplang/v2/backends/crypto_impl.py +723 -0
mplang/v2/backends/field_impl.py +454 -0
mplang/v2/backends/func_impl.py +107 -0
mplang/v2/backends/phe_impl.py +148 -0
mplang/v2/backends/simp_design.md +136 -0
mplang/v2/backends/simp_driver/__init__.py +41 -0
mplang/v2/backends/simp_driver/http.py +168 -0
mplang/v2/backends/simp_driver/mem.py +280 -0
mplang/v2/backends/simp_driver/ops.py +135 -0
mplang/v2/backends/simp_driver/state.py +60 -0
mplang/v2/backends/simp_driver/values.py +52 -0
mplang/v2/backends/simp_worker/__init__.py +29 -0
mplang/v2/backends/simp_worker/http.py +354 -0
mplang/v2/backends/simp_worker/mem.py +102 -0
mplang/v2/backends/simp_worker/ops.py +167 -0
mplang/v2/backends/simp_worker/state.py +49 -0
mplang/v2/backends/spu_impl.py +275 -0
mplang/v2/backends/spu_state.py +187 -0
mplang/v2/backends/store_impl.py +62 -0
mplang/v2/backends/table_impl.py +838 -0
mplang/v2/backends/tee_impl.py +215 -0
mplang/v2/backends/tensor_impl.py +519 -0
mplang/v2/cli.py +603 -0
mplang/v2/cli_guide.md +122 -0
mplang/v2/dialects/__init__.py +36 -0
mplang/v2/dialects/bfv.py +665 -0
mplang/v2/dialects/crypto.py +689 -0
mplang/v2/dialects/dtypes.py +378 -0
mplang/v2/dialects/field.py +210 -0
mplang/v2/dialects/func.py +135 -0
mplang/v2/dialects/phe.py +723 -0
mplang/v2/dialects/simp.py +944 -0
mplang/v2/dialects/spu.py +349 -0
mplang/v2/dialects/store.py +63 -0
mplang/v2/dialects/table.py +407 -0
mplang/v2/dialects/tee.py +346 -0
mplang/v2/dialects/tensor.py +1175 -0
mplang/v2/edsl/README.md +279 -0
mplang/v2/edsl/__init__.py +99 -0
mplang/v2/edsl/context.py +311 -0
mplang/v2/edsl/graph.py +463 -0
mplang/v2/edsl/jit.py +62 -0
mplang/v2/edsl/object.py +53 -0
mplang/v2/edsl/primitive.py +284 -0
mplang/v2/edsl/printer.py +119 -0
mplang/v2/edsl/registry.py +207 -0
mplang/v2/edsl/serde.py +375 -0
mplang/v2/edsl/tracer.py +614 -0
mplang/v2/edsl/typing.py +816 -0
mplang/v2/kernels/Makefile +30 -0
mplang/v2/kernels/__init__.py +23 -0
mplang/v2/kernels/gf128.cpp +148 -0
mplang/v2/kernels/ldpc.cpp +82 -0
mplang/v2/kernels/okvs.cpp +283 -0
mplang/v2/kernels/okvs_opt.cpp +291 -0
mplang/v2/kernels/py_kernels.py +398 -0
mplang/v2/libs/collective.py +330 -0
mplang/v2/libs/device/__init__.py +51 -0
mplang/v2/libs/device/api.py +813 -0
mplang/v2/libs/device/cluster.py +352 -0
mplang/v2/libs/ml/__init__.py +23 -0
mplang/v2/libs/ml/sgb.py +1861 -0
mplang/v2/libs/mpc/__init__.py +41 -0
mplang/v2/libs/mpc/_utils.py +99 -0
mplang/v2/libs/mpc/analytics/__init__.py +35 -0
mplang/v2/libs/mpc/analytics/aggregation.py +372 -0
mplang/v2/libs/mpc/analytics/groupby.md +99 -0
mplang/v2/libs/mpc/analytics/groupby.py +331 -0
mplang/v2/libs/mpc/analytics/permutation.py +386 -0
mplang/v2/libs/mpc/common/constants.py +39 -0
mplang/v2/libs/mpc/ot/__init__.py +32 -0
mplang/v2/libs/mpc/ot/base.py +222 -0
mplang/v2/libs/mpc/ot/extension.py +477 -0
mplang/v2/libs/mpc/ot/silent.py +217 -0
mplang/v2/libs/mpc/psi/__init__.py +40 -0
mplang/v2/libs/mpc/psi/cuckoo.py +228 -0
mplang/v2/libs/mpc/psi/okvs.py +49 -0
mplang/v2/libs/mpc/psi/okvs_gct.py +79 -0
mplang/v2/libs/mpc/psi/oprf.py +310 -0
mplang/v2/libs/mpc/psi/rr22.py +344 -0
mplang/v2/libs/mpc/psi/unbalanced.py +200 -0
mplang/v2/libs/mpc/vole/__init__.py +31 -0
mplang/v2/libs/mpc/vole/gilboa.py +327 -0
mplang/v2/libs/mpc/vole/ldpc.py +383 -0
mplang/v2/libs/mpc/vole/silver.py +336 -0
mplang/v2/runtime/__init__.py +15 -0
mplang/v2/runtime/dialect_state.py +41 -0
mplang/v2/runtime/interpreter.py +871 -0
mplang/v2/runtime/object_store.py +194 -0
mplang/v2/runtime/value.py +141 -0
{mplang_nightly-0.1.dev158.dist-info → mplang_nightly-0.1.dev268.dist-info}/METADATA +24 -17
mplang_nightly-0.1.dev268.dist-info/RECORD +180 -0
{mplang_nightly-0.1.dev158.dist-info → mplang_nightly-0.1.dev268.dist-info}/WHEEL +1 -1
mplang/core/__init__.py +0 -92
mplang/device.py +0 -340
mplang/kernels/builtin.py +0 -207
mplang/ops/crypto.py +0 -109
mplang/ops/ibis_cc.py +0 -139
mplang/ops/sql.py +0 -61
mplang/protos/v1alpha1/mpir_pb2_grpc.py +0 -3
mplang/runtime/link_comm.py +0 -131
mplang/simp/smpc.py +0 -201
mplang/utils/table_utils.py +0 -73
mplang_nightly-0.1.dev158.dist-info/RECORD +0 -77
/mplang/{core → v1/core}/mask.py +0 -0
/mplang/{protos → v1/protos}/v1alpha1/mpir_pb2.py +0 -0
/mplang/{runtime → v1/runtime}/exceptions.py +0 -0
/mplang/{runtime → v1/runtime}/http_api.md +0 -0
/mplang/{kernels → v1/simp}/__init__.py +0 -0
/mplang/{utils → v1/utils}/__init__.py +0 -0
/mplang/{utils → v1/utils}/crypto.py +0 -0
/mplang/{utils → v1/utils}/func_utils.py +0 -0
/mplang/{utils → v1/utils}/spu_utils.py +0 -0
{mplang_nightly-0.1.dev158.dist-info → mplang_nightly-0.1.dev268.dist-info}/entry_points.txt +0 -0
{mplang_nightly-0.1.dev158.dist-info → mplang_nightly-0.1.dev268.dist-info}/licenses/LICENSE +0 -0

mplang/v2/libs/mpc/__init__.py ADDED Viewed

@@ -0,0 +1,41 @@
+# Copyright 2025 Ant Group Co., Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""MPC (Multi-Party Computation) library for MPLang2.
+Subpackages:
+- ot: Oblivious Transfer protocols
+- vole: Vector OLE protocols
+- psi: Private Set Intersection
+- analytics: Privacy-preserving analytics
+Example usage:
+    from mplang.v2.libs.mpc import ot_transfer, apply_permutation
+    from mplang.v2.libs.mpc.vole import silver_vole
+    from mplang.v2.libs.mpc.psi import psi_intersect
+"""
+from .analytics.aggregation import rotate_and_sum
+from .analytics.groupby import oblivious_groupby_sum_bfv, oblivious_groupby_sum_shuffle
+from .analytics.permutation import apply_permutation, secure_switch
+from .ot.base import transfer as ot_transfer
+# Public API of this package: exactly the names re-exported by the imports above.
+__all__ = [
+    "apply_permutation",
+    "oblivious_groupby_sum_bfv",
+    "oblivious_groupby_sum_shuffle",
+    "ot_transfer",
+    "rotate_and_sum",
+    "secure_switch",
+]

mplang/v2/libs/mpc/_utils.py ADDED Viewed

@@ -0,0 +1,99 @@
+# Copyright 2025 Ant Group Co., Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Utilities for MPC protocols."""
+from __future__ import annotations
+from typing import Any, cast
+import jax.numpy as jnp
+import mplang.v2.edsl as el
+from mplang.v2.dialects import tensor
+def bytes_to_bits(data: el.Object) -> el.Object:
+    """Convert bytes (uint8 tensor) to bits (uint8 tensor of 0s and 1s).
+    Output shape logic: (..., N) -> (..., N * 8)
+    """
+    def _to_bits(arr: Any) -> Any:
+        # View as u8
+        y_u8 = arr.view(jnp.uint8)
+        # Unpack produces Big Endian bits [b7, b6, ..., b0] per byte
+        bits = jnp.unpackbits(y_u8)
+        # Reshape to (N, 8) and flip to get [b0, ..., b7]
+        bits = bits.reshape(-1, 8)
+        bits = jnp.fliplr(bits)
+        return bits.reshape(-1)
+    return cast(el.Object, tensor.run_jax(_to_bits, data))
+def bits_to_bytes(bits: el.Object) -> el.Object:
+    """Convert bits to bytes.
+    Output shape logic: (..., N * 8) -> (..., N)
+    """
+    def _to_bytes(arr: Any) -> Any:
+        return jnp.packbits(arr, axis=-1)
+    return cast(el.Object, tensor.run_jax(_to_bytes, bits))
+def transpose_128(matrix_bits: el.Object) -> el.Object:
+    """Transpose a bit matrix.
+    Just a wrapper for tensor.transpose currently.
+    """
+    return tensor.transpose(matrix_bits, perm=(1, 0))
+class CuckooHash:
+    """Simple Cuckoo Hashing simulation."""
+    def __init__(self, num_bins: int, num_hash_functions: int = 3, stash_size: int = 0):
+        self.num_bins = num_bins
+        self.num_functions = num_hash_functions
+        self.stash_size = stash_size
+    def hash(self, items: el.Object, seed: int) -> el.Object:
+        """Hash items to bin indices."""
+        # We perform hashing.
+        # Note: We return hashes for each function?
+        # Usually simplest cuckoo uses 3 hash functions.
+        # We can return (num_funcs, N) or (N, num_funcs)
+        def _hash_fn(xs: Any, s: int) -> Any:
+            # xs: array of items
+            # Simple hash: (x * s + s) % bins
+            # We want multiple hashes?
+            # For now, let's just return one hash per seed provided (assuming call per seed)
+            # Or if seed is a single int, we might mix it.
+            # Let's assume this function handles one hash instance.
+            res = (xs * s + s) % self.num_bins
+            return res.astype(jnp.int32)
+        # Passing self.num_bins as constant implementation detail inside _hash_fn closure is fine
+        # if using run_jax (as it's compiled).
+        # Actually run_jax recompiles if closure changes?
+        # run_jax supports closures.
+        return cast(el.Object, tensor.run_jax(_hash_fn, items, seed))

mplang/v2/libs/mpc/analytics/__init__.py ADDED Viewed

@@ -0,0 +1,35 @@
+# Copyright 2025 Ant Group Co., Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Privacy-preserving analytics operations.
+Submodules:
+- aggregation: BFV homomorphic aggregation
+- groupby: Oblivious Group-By operations
+- permutation: Secure permutation (Bitonic Sort)
+"""
+from .aggregation import aggregate_sparse, batch_bucket_aggregate, rotate_and_sum
+from .groupby import oblivious_groupby_sum_bfv, oblivious_groupby_sum_shuffle
+from .permutation import apply_permutation, secure_switch
+# Public API of the analytics subpackage: the names re-exported by the imports above.
+__all__ = [
+    "aggregate_sparse",
+    "apply_permutation",
+    "batch_bucket_aggregate",
+    "oblivious_groupby_sum_bfv",
+    "oblivious_groupby_sum_shuffle",
+    "rotate_and_sum",
+    "secure_switch",
+]

mplang/v2/libs/mpc/analytics/aggregation.py ADDED Viewed

@@ -0,0 +1,372 @@
+# Copyright 2025 Ant Group Co., Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Homomorphic Aggregation library.
+This module implements efficient aggregation algorithms using BFV rotation.
+"""
+from __future__ import annotations
+import math
+from typing import Any
+import numpy as np
+from mplang.v2.dialects import bfv, tensor
+def _safe_rotate(
+    ciphertext: Any, step: int, galois_keys: Any, max_step: int = 1024
+) -> Any:
+    """Rotate ciphertext by step, decomposing large steps if needed.
+    SEAL's rotate_rows requires step to be in range (-slot_count/2, slot_count/2).
+    For poly_modulus_degree=4096, slot_count=4096, max valid step is 2047.
+    We use a conservative max_step=1024 by default for safety.
+    For large steps, we decompose into multiple rotations:
+    - rotate(x, 3000) = rotate(rotate(rotate(x, 1024), 1024), 952)
+    """
+    if step == 0:
+        return ciphertext
+    if abs(step) <= max_step:
+        return bfv.rotate(ciphertext, step, galois_keys)
+    # Decompose large step into multiple rotations
+    current = ciphertext
+    remaining = abs(step)
+    sign = 1 if step > 0 else -1
+    while remaining > 0:
+        rot = min(remaining, max_step)
+        current = bfv.rotate(current, sign * rot, galois_keys)
+        remaining -= rot
+    return current
+def _rotate_and_sum_row(
+    ciphertext: Any, k: int, galois_keys: Any, max_step: int = 1024
+) -> Any:
+    """Sum first k elements within a single row (k <= row_size).
+    Uses the recursive doubling algorithm with O(log k) rotations.
+    """
+    if k <= 1:
+        return ciphertext
+    num_steps = math.ceil(math.log2(k))
+    current = ciphertext
+    for i in range(num_steps):
+        step = 1 << i
+        if step >= k:
+            break
+        rotated = _safe_rotate(current, step, galois_keys, max_step)
+        current = bfv.add(current, rotated)
+    return current
+def rotate_and_sum(
+    ciphertext: Any, k: int, galois_keys: Any, slot_count: int = 4096
+) -> Any:
+    """Aggregate the first k elements of a ciphertext using O(log k) rotations.
+    The result is placed in the 0-th slot.
+    This assumes the input ciphertext has relevant data in slots 0..k-1
+    and zeros (or irrelevant data) elsewhere, OR that the caller will mask the result.
+    Args:
+        ciphertext: The BFV ciphertext.
+        k: The number of elements to sum.
+        galois_keys: Keys required for rotation.
+        slot_count: Total number of slots (default 4096 for poly_degree=4096).
+    Returns:
+        Ciphertext where slot 0 contains sum(ciphertext[0..k-1]).
+    Note:
+        SEAL batching arranges slots as 2 rows of slot_count/2 each.
+        - rotate_rows rotates within each row (circular)
+        - rotate_columns swaps the two rows
+        For k <= row_size (2048), only row rotations are needed.
+        For k > row_size, we use rotate_columns to aggregate across rows.
+    """
+    row_size = slot_count // 2
+    if k <= row_size:
+        # Simple case: all elements in row 0
+        return _rotate_and_sum_row(ciphertext, k, galois_keys)
+    # k > row_size: data spans both rows
+    # Strategy:
+    # 1. Sum row 0 completely (row_size elements)
+    # 2. rotate_columns to bring row 1 to row 0 position
+    # 3. Sum the first (k - row_size) elements of what was row 1
+    # 4. Add the two partial sums
+    # Sum row 0 completely
+    row0_sum = _rotate_and_sum_row(ciphertext, row_size, galois_keys)
+    # Rotate columns: swap row 0 <-> row 1
+    # Now row 1's data is in row 0 position
+    col_rotated = bfv.rotate_columns(ciphertext, galois_keys)
+    # Sum the first (k - row_size) elements (originally in row 1)
+    row1_count = k - row_size
+    row1_sum = _rotate_and_sum_row(col_rotated, row1_count, galois_keys)
+    # Both row0_sum and row1_sum have their results in slot 0
+    # Add them together
+    return bfv.add(row0_sum, row1_sum)
+def aggregate_sparse(
+    ciphertext: Any,
+    aggregations: list[tuple[int, list[int]]],
+    galois_keys: Any,
+    encoder: Any,
+    vector_size: int,
+) -> Any:
+    """Perform sparse aggregation.
+    Args:
+        ciphertext: Input ciphertext.
+        aggregations: List of (target_slot, [source_slots]).
+                      e.g. [(0, [0, 3, 8]), (1, [1, 5])]
+        galois_keys: Rotation keys.
+        encoder: BFV encoder for encoding masks.
+        vector_size: Total size of the vector (slots).
+    Returns:
+        Ciphertext with aggregated results in target slots.
+    """
+    # Naive approach: For each target, sum sources.
+    # Optimized approach:
+    # 1. Decompose into rotations.
+    #    For target t, source s: need rotation by (t-s).
+    #    Group by rotation amount.
+    # 2. Apply rotations and accumulate.
+    # Map: rotation_amount -> mask
+    # We want to compute: Result = Sum( Rotate(Input, r) * Mask_r )
+    # where Mask_r has 1 at slot t if (t - r) is a source for t.
+    # Example: t=0, s={0, 3, 8}.
+    #   s=0: rot=0. Mask[0]=1.
+    #   s=3: rot=-3. Mask[0]=1.
+    #   s=8: rot=-8. Mask[0]=1.
+    # Example: t=1, s={1, 5}.
+    #   s=1: rot=0. Mask[1]=1.
+    #   s=5: rot=-4. Mask[1]=1.
+    # Combined:
+    # Rot 0: Mask[0]=1, Mask[1]=1. -> Mask = [1, 1, 0...]
+    # Rot -3: Mask[0]=1. -> Mask = [1, 0...]
+    # Rot -8: Mask[0]=1. -> Mask = [1, 0...]
+    # Rot -4: Mask[1]=1. -> Mask = [0, 1, 0...]
+    rotations = {}  # shift -> mask_list
+    for target, sources in aggregations:
+        for src in sources:
+            shift = src - target
+            if shift not in rotations:
+                rotations[shift] = [0] * vector_size
+            rotations[shift][target] = 1
+    final_result = None
+    for shift, mask_list in rotations.items():
+        # Optimization: Skip if mask is all zeros (no contribution from this rotation)
+        if not any(mask_list):
+            continue
+        # Create mask plaintext
+        # In a real implementation, we encode this list to a Plaintext
+        mask_tensor = tensor.constant(np.array(mask_list, dtype=np.int64))
+        mask_pt = bfv.encode(mask_tensor, encoder)
+        # Rotate
+        if shift == 0:
+            rotated_c = ciphertext
+        else:
+            rotated_c = bfv.rotate(ciphertext, shift, galois_keys)
+        # Mask
+        masked_c = bfv.mul(rotated_c, mask_pt)
+        # Accumulate
+        if final_result is None:
+            final_result = masked_c
+        else:
+            final_result = bfv.add(final_result, masked_c)
+    return final_result
+def masked_aggregate(ciphertexts: list[Any], masks: list[Any]) -> Any:
+    """Aggregate multiple partial results using masks.
+    Args:
+        ciphertexts: List of ciphertexts.
+        masks: List of plaintexts (masks).
+    Returns:
+        Sum(ct * mask)
+    """
+    if not ciphertexts or not masks:
+        raise ValueError("Empty input lists")
+    if len(ciphertexts) != len(masks):
+        raise ValueError("Mismatch in ciphertexts and masks length")
+    total = None
+    for ct, mask in zip(ciphertexts, masks, strict=True):
+        # ct * mask
+        masked = bfv.mul(ct, mask)
+        if total is None:
+            total = masked
+        else:
+            total = bfv.add(total, masked)
+    return total
+# ==============================================================================
+# SIMD Bucket Packing for Histogram Computation
+# ==============================================================================
+def strided_rotate_and_sum(
+    ciphertext: Any,
+    stride: int,
+    n_elements: int,
+    galois_keys: Any,
+    max_step: int = 1024,
+) -> Any:
+    """Aggregate elements at positions [0, stride, 2*stride, ...] into slot 0.
+    This is used for SIMD bucket packing where each bucket's values are
+    placed at strided positions.
+    Args:
+        ciphertext: The BFV ciphertext with values at strided positions.
+        stride: Distance between consecutive elements to sum.
+        n_elements: Number of elements to aggregate (at positions 0, stride, ..., (n-1)*stride).
+        galois_keys: Rotation keys.
+        max_step: Maximum rotation step for safe_rotate.
+    Returns:
+        Ciphertext where slot 0 contains sum of strided elements.
+    Example:
+        stride=64, n_elements=47 (bucket has 47 samples)
+        Values at slots: 0, 64, 128, 192, ...
+        Result: slot[0] = sum of all these values
+    """
+    if n_elements <= 1:
+        return ciphertext
+    # Use recursive doubling with strided rotations
+    # Step 1: rotate by stride, add -> pairs summed at even positions
+    # Step 2: rotate by 2*stride, add -> quads summed at positions 0, 4*stride, ...
+    # ...
+    num_steps = math.ceil(math.log2(n_elements))
+    current = ciphertext
+    for i in range(num_steps):
+        step = stride * (1 << i)
+        if step >= n_elements * stride:
+            break
+        rotated = _safe_rotate(current, step, galois_keys, max_step)
+        current = bfv.add(current, rotated)
+    return current
+def batch_bucket_aggregate(
+    ciphertext: Any,
+    n_buckets: int,
+    samples_per_bucket: int,
+    galois_keys: Any,
+    slot_count: int = 4096,
+) -> Any:
+    """Aggregate samples within each bucket region in a packed ciphertext.
+    Assumes the ciphertext has the following layout:
+    - slot_count is divided into n_buckets regions of size `stride = slot_count // n_buckets`
+    - Each bucket b occupies slots [b*stride, b*stride + samples_per_bucket)
+    - Samples are placed at consecutive positions within their bucket region
+    After aggregation, slot[b * stride] contains sum of bucket b.
+    Args:
+        ciphertext: Packed ciphertext with samples in bucket regions.
+        n_buckets: Number of buckets.
+        samples_per_bucket: Max samples per bucket (for rotation count).
+        galois_keys: Rotation keys.
+        slot_count: Total BFV slots.
+    Returns:
+        Ciphertext where slot[b * stride] = sum of bucket b's values.
+    """
+    if samples_per_bucket <= 1:
+        return ciphertext
+    # Use recursive doubling within each bucket region
+    # Since all buckets use the same relative positions, one set of rotations
+    # aggregates ALL buckets simultaneously!
+    num_steps = math.ceil(math.log2(samples_per_bucket))
+    current = ciphertext
+    for i in range(num_steps):
+        step = 1 << i
+        if step >= samples_per_bucket:
+            break
+        # Rotating by `step` shifts values within each bucket region
+        # Add original + rotated to sum pairs/quads/etc.
+        rotated = _safe_rotate(current, step, galois_keys)
+        current = bfv.add(current, rotated)
+    return current
+def extract_bucket_results(
+    vector: Any,
+    n_buckets: int,
+    slot_count: int = 4096,
+) -> Any:
+    """Extract bucket sums from a packed result vector.
+    After batch_bucket_aggregate, each bucket's sum is at slot[b * stride].
+    This function extracts those values.
+    Args:
+        vector: Decoded vector from packed ciphertext.
+        n_buckets: Number of buckets.
+        slot_count: Total slots.
+    Returns:
+        (n_buckets,) array of bucket sums.
+    """
+    import jax.numpy as jnp
+    stride = slot_count // n_buckets
+    indices = jnp.arange(n_buckets) * stride
+    return vector[indices]

mplang/v2/libs/mpc/analytics/groupby.md ADDED Viewed

@@ -0,0 +1,99 @@
+# Oblivious Group-by Sum Design
+This document outlines the design for Oblivious Group-by Sum algorithms in MPLang. The goal is to compute the sum of values in `data` (held by P0) grouped by `bins` (held by P1), such that:
+- P0 learns nothing about the `bins` (permutation/grouping).
+- P1 learns nothing about the `data` values (except the final aggregated sums).
+- The result is revealed to P1 (or shared).
+We propose two approaches based on the trade-off between communication and computation, and the cardinality of groups ($K$).
+## Interface
+```python
+def oblivious_groupby_sum(
+    data: Plaintext[P0],
+    bins: Plaintext[P1],
+    K: int,
+    method: str = "auto"
+) -> Plaintext[P1]:
+    """
+    Args:
+        data: Input data vector held by P0.
+        bins: Bin assignments for each data element held by P1.
+              Values must be in [0, K).
+        K: The number of bins (groups).
+        method: "auto" (default), "bfv" (HE-based), or "shuffle" (OT-based).
+    Returns:
+        A vector of length K held by P1 containing the sum of data for each bin.
+    """
+```
+## Approach 1: HE-based (BFV SIMD)
+Best for: **Small K** (e.g., $K < 1000$), Low Bandwidth.
+### Algorithm
+1.  **Encryption (P0)**:
+    - P0 encrypts `data` using a BFV scheme with SIMD packing.
+    - Sends ciphertext(s) `Enc(data)` to P1.
+2.  **Aggregation (P1)**:
+    - P1 holds `bins`. For each bin $k \in [0, K)$:
+        - Construct a plaintext mask vector $M_k$ where $M_k[i] = 1$ if $bins[i] == k$, else $0$.
+        - Compute the homomorphic element-wise product $Enc(V_k) = Enc(data) \otimes M_k$, which keeps only the entries that belong to bin $k$.
+        - Sum the slots of $Enc(V_k)$ to get the total sum $S_k$ for bin $k$.
+          - *Optimization*: Instead of full slot summation for every bin (which is expensive), P1 can just compute the element-wise product and accumulate. The final reduction can be done by sending back to P0 or using rotations if $K$ is small enough to pack into result ciphertexts.
+          - *Simplified Flow*: P1 computes $Enc(Partial_k) = Enc(data) \cdot M_k$. P1 sends these $K$ ciphertexts (or batched versions) back to P0.
+3.  **Decryption & Finalize (P0 -> P1)**:
+    - P0 decrypts the partial sums.
+    - P0 computes the sum of the vector for each bin.
+    - P0 sends the final $K$ sums to P1.
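+    - *Privacy Note*: To prevent P0 from learning the per-bin partial sums (which reveal how the data is distributed across bins), P1 should add a random mask to each result before sending it to P0, or use proper threshold decryption if available. In the "Simplified Flow" above, P0 decrypts $data \cdot M_k$ for every bin, i.e. its own data with every entry outside bin $k$ zeroed out, so the positions of the surviving entries leak the bin assignments to P0. The refined flow below avoids this.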
+    - *Refined Privacy Flow*:
+        - P1 computes $Enc(V_k) = Enc(data) \cdot M_k$.
+        - P1 computes $Enc(S_k) = \text{TotalSum}(Enc(V_k))$ using rotations and additions.
+        - P1 masks $Enc(S_k)$ with a random value $r_k$: $Enc(O_k) = Enc(S_k) + Enc(r_k)$.
+        - P1 sends $Enc(O_k)$ to P0.
+        - P0 decrypts to get $O_k = S_k + r_k$ and sends back to P1.
+        - P1 subtracts $r_k$ to get $S_k$.
+### Complexity
+- **Comm**: $O(N/B)$ ciphertexts (P0->P1) + $O(K)$ ciphertexts (P1->P0). ($B$ is batch size).
+- **Comp**: $O(K \cdot N/B)$ homomorphic multiplications and additions.
+## Approach 2: OT-based (Shuffle + Prefix Sum)
+Best for: **Large K**, High Bandwidth.
+### Algorithm
+1.  **Sort Permutation (P1)**:
+    - P1 calculates a permutation $\pi$ that sorts `data` according to `bins`.
+    - P1 calculates boundary indices for each bin.
+2.  **Oblivious Shuffle (P0, P1)**:
+    - Use a Benes network or similar switching network.
+    - P0 inputs `data`. P1 inputs control bits derived from $\pi$.
+    - Output: Secret shares of permuted data $\langle D' \rangle_0, \langle D' \rangle_1$.
+3.  **Secret Shared Prefix Sum (P0, P1)**:
+    - Locally compute prefix sums of shares: $\langle S \rangle_0 = \text{cumsum}(\langle D' \rangle_0)$, $\langle S \rangle_1 = \text{cumsum}(\langle D' \rangle_1)$.
+4.  **Oblivious Gather (P0, P1)**:
+    - P1 knows the boundary indices $idx_k$.
+    - P1 needs $S[idx_k] = \langle S \rangle_0[idx_k] + \langle S \rangle_1[idx_k]$.
+    - P1 has $\langle S \rangle_1[idx_k]$ locally.
+    - To get $\langle S \rangle_0[idx_k]$ obliviously:
+        - Use another permutation network or ORAM to fetch these values without revealing $idx_k$ to P0.
+        - Or, since P1 is the result receiver, we can use a simpler selection protocol if we don't hide the access pattern from P0 (but we must hide it to protect bin sizes).
+        - A second shuffle network mapping $idx_k \to k$ is secure.
+5.  **Difference (P1)**:
+    - P1 computes $Result[k] = S[idx_k] - S[idx_{k-1}]$, taking $S[idx_{-1}] = 0$ for the first bin.
+### Complexity
+- **Comm**: $O(N \log N)$ bits for shuffle.
+- **Comp**: Low (symmetric crypto).

mplang-nightly 0.1.dev158__py3-none-any.whl → 0.1.dev268__py3-none-any.whl

mplang-nightly 0.1.dev158py3-none-any.whl → 0.1.dev268py3-none-any.whl