PyPI - cotengrust - Versions diffs - 0.1.1__tar.gz → 0.1.3__tar.gz - Mend

cotengrust 0.1.1.tar.gz → 0.1.3.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11) hide show

cotengrust-0.1.3/.github/workflows/CI.yml +138 -0
{cotengrust-0.1.1 → cotengrust-0.1.3}/Cargo.lock +34 -19
{cotengrust-0.1.1 → cotengrust-0.1.3}/Cargo.toml +3 -3
{cotengrust-0.1.1 → cotengrust-0.1.3}/PKG-INFO +83 -7
{cotengrust-0.1.1 → cotengrust-0.1.3}/README.md +81 -5
{cotengrust-0.1.1 → cotengrust-0.1.3}/pyproject.toml +2 -2
{cotengrust-0.1.1 → cotengrust-0.1.3}/src/lib.rs +203 -50
{cotengrust-0.1.1 → cotengrust-0.1.3}/tests/test_cotengrust.py +33 -3
cotengrust-0.1.1/.github/workflows/CI.yml +0 -162
{cotengrust-0.1.1 → cotengrust-0.1.3}/.gitignore +0 -0
{cotengrust-0.1.1 → cotengrust-0.1.3}/LICENSE +0 -0

cotengrust-0.1.3/.github/workflows/CI.yml ADDED Viewed

@@ -0,0 +1,138 @@
+# This file is autogenerated by maturin v1.5.1
+# To update, run
+#
+#    maturin generate-ci github
+#
+name: CI
+on:
+  push:
+    branches:
+      - main
+      - master
+    tags:
+      - '*'
+  pull_request:
+  workflow_dispatch:
+permissions:
+  contents: read
+jobs:
+  linux:
+    runs-on: ${{ matrix.platform.runner }}
+    strategy:
+      matrix:
+        platform:
+          - runner: ubuntu-latest
+            target: x86_64
+          - runner: ubuntu-latest
+            target: x86
+          - runner: ubuntu-latest
+            target: aarch64
+          - runner: ubuntu-latest
+            target: armv7
+          - runner: ubuntu-latest
+            target: s390x
+          - runner: ubuntu-latest
+            target: ppc64le
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-python@v5
+        with:
+          python-version: '3.10'
+      - name: Build wheels
+        uses: PyO3/maturin-action@v1
+        with:
+          target: ${{ matrix.platform.target }}
+          args: --release --out dist --find-interpreter
+          sccache: 'true'
+          manylinux: auto
+      - name: Upload wheels
+        uses: actions/upload-artifact@v4
+        with:
+          name: wheels-linux-${{ matrix.platform.target }}
+          path: dist
+  windows:
+    runs-on: ${{ matrix.platform.runner }}
+    strategy:
+      matrix:
+        platform:
+          - runner: windows-latest
+            target: x64
+          - runner: windows-latest
+            target: x86
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-python@v5
+        with:
+          python-version: '3.10'
+          architecture: ${{ matrix.platform.target }}
+      - name: Build wheels
+        uses: PyO3/maturin-action@v1
+        with:
+          target: ${{ matrix.platform.target }}
+          args: --release --out dist --find-interpreter
+          sccache: 'true'
+      - name: Upload wheels
+        uses: actions/upload-artifact@v4
+        with:
+          name: wheels-windows-${{ matrix.platform.target }}
+          path: dist
+  macos:
+    runs-on: ${{ matrix.platform.runner }}
+    strategy:
+      matrix:
+        platform:
+          - runner: macos-latest
+            target: x86_64
+          - runner: macos-14
+            target: aarch64
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-python@v5
+        with:
+          python-version: '3.10'
+      - name: Build wheels
+        uses: PyO3/maturin-action@v1
+        with:
+          target: ${{ matrix.platform.target }}
+          args: --release --out dist --find-interpreter
+          sccache: 'true'
+      - name: Upload wheels
+        uses: actions/upload-artifact@v4
+        with:
+          name: wheels-macos-${{ matrix.platform.target }}
+          path: dist
+  sdist:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Build sdist
+        uses: PyO3/maturin-action@v1
+        with:
+          command: sdist
+          args: --out dist
+      - name: Upload sdist
+        uses: actions/upload-artifact@v4
+        with:
+          name: wheels-sdist
+          path: dist
+  release:
+    name: Release
+    runs-on: ubuntu-latest
+    if: startsWith(github.ref, 'refs/tags/')
+    needs: [linux, windows, macos, sdist]
+    steps:
+      - uses: actions/download-artifact@v4
+      - name: Publish to PyPI
+        uses: PyO3/maturin-action@v1
+        env:
+          MATURIN_PYPI_TOKEN: ${{ secrets.PYPI_API_TOKEN }}
+        with:
+          command: upload
+          args: --non-interactive --skip-existing wheels-*/*

{cotengrust-0.1.1 → cotengrust-0.1.3}/Cargo.lock RENAMED Viewed

@@ -37,7 +37,7 @@ checksum = "baf1de4339761588bc0619e3cbc0120ee582ebb74b53b4efbf79117bd2da40fd"
 [[package]]
 name = "cotengrust"
-version = "0.1.1"
+version = "0.1.3"
 dependencies = [
  "bit-set",
  "ordered-float",
@@ -57,11 +57,17 @@ dependencies = [
  "wasi",
 ]
+[[package]]
+name = "heck"
+version = "0.4.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "95505c38b4572b2d910cecb0281560f54b440a19336cbbcb27bf6ce6adc6f5a8"
 [[package]]
 name = "indoc"
-version = "1.0.9"
+version = "2.0.4"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "bfa799dd5ed20a7e349f3b4639aa80d74549c81716d9ec4f994c9b5815598306"
+checksum = "1e186cfbae8084e513daff4240b4797e342f988cecda4fb6c939150f96315fd8"
 [[package]]
 name = "libc"
@@ -105,9 +111,9 @@ checksum = "dd8b5dd2ae5ed71462c540258bedcb51965123ad7e7ccf4b9a8cafaa4a63576d"
 [[package]]
 name = "ordered-float"
-version = "3.9.1"
+version = "4.2.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "2a54938017eacd63036332b4ae5c8a49fc8c0c1d6d629893057e4f13609edd06"
+checksum = "a76df7075c7d4d01fdcb46c912dd17fba5b60c78ea480b475f2b6ab6f666584e"
 dependencies = [
  "num-traits",
 ]
@@ -135,6 +141,12 @@ dependencies = [
  "windows-targets",
 ]
+[[package]]
+name = "portable-atomic"
+version = "1.6.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7170ef9988bc169ba16dd36a7fa041e5c4cbeb6a35b76d4c03daded371eae7c0"
 [[package]]
 name = "ppv-lite86"
 version = "0.2.17"
@@ -152,15 +164,16 @@ dependencies = [
 [[package]]
 name = "pyo3"
-version = "0.19.2"
+version = "0.21.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "e681a6cfdc4adcc93b4d3cf993749a4552018ee0a9b65fc0ccfad74352c72a38"
+checksum = "a7a8b1990bd018761768d5e608a13df8bd1ac5f678456e0f301bb93e5f3ea16b"
 dependencies = [
  "cfg-if",
  "indoc",
  "libc",
  "memoffset",
  "parking_lot",
+ "portable-atomic",
  "pyo3-build-config",
  "pyo3-ffi",
  "pyo3-macros",
@@ -169,9 +182,9 @@ dependencies = [
 [[package]]
 name = "pyo3-build-config"
-version = "0.19.2"
+version = "0.21.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "076c73d0bc438f7a4ef6fdd0c3bb4732149136abd952b110ac93e4edb13a6ba5"
+checksum = "650dca34d463b6cdbdb02b1d71bfd6eb6b6816afc708faebb3bac1380ff4aef7"
 dependencies = [
  "once_cell",
  "target-lexicon",
@@ -179,9 +192,9 @@ dependencies = [
 [[package]]
 name = "pyo3-ffi"
-version = "0.19.2"
+version = "0.21.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "e53cee42e77ebe256066ba8aa77eff722b3bb91f3419177cf4cd0f304d3284d9"
+checksum = "09a7da8fc04a8a2084909b59f29e1b8474decac98b951d77b80b26dc45f046ad"
 dependencies = [
  "libc",
  "pyo3-build-config",
@@ -189,9 +202,9 @@ dependencies = [
 [[package]]
 name = "pyo3-macros"
-version = "0.19.2"
+version = "0.21.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "dfeb4c99597e136528c6dd7d5e3de5434d1ceaf487436a3f03b2d56b6fc9efd1"
+checksum = "4b8a199fce11ebb28e3569387228836ea98110e43a804a530a9fd83ade36d513"
 dependencies = [
  "proc-macro2",
  "pyo3-macros-backend",
@@ -201,11 +214,13 @@ dependencies = [
 [[package]]
 name = "pyo3-macros-backend"
-version = "0.19.2"
+version = "0.21.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "947dc12175c254889edc0c02e399476c2f652b4b9ebd123aa655c224de259536"
+checksum = "93fbbfd7eb553d10036513cb122b888dcd362a945a00b06c165f2ab480d4cc3b"
 dependencies = [
+ "heck",
  "proc-macro2",
+ "pyo3-build-config",
  "quote",
  "syn",
 ]
@@ -278,9 +293,9 @@ checksum = "62bb4feee49fdd9f707ef802e22365a35de4b7b299de4763d44bfea899442ff9"
 [[package]]
 name = "syn"
-version = "1.0.109"
+version = "2.0.32"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "72b64191b275b66ffe2469e8af2c1cfe3bafa67b529ead792a6d0160888b4237"
+checksum = "239814284fd6f1a4ffe4ca893952cdd93c224b6a1571c9a9eadd670295c0c9e2"
 dependencies = [
  "proc-macro2",
  "quote",
@@ -301,9 +316,9 @@ checksum = "301abaae475aa91687eb82514b328ab47a211a533026cb25fc3e519b86adfc3c"
 [[package]]
 name = "unindent"
-version = "0.1.11"
+version = "0.2.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "e1766d682d402817b5ac4490b3c3002d91dfa0d22812f341609f97b08757359c"
+checksum = "c7de7d73e1754487cb58364ee906a499937a0dfabd86bcb980fa99ec8c8fa2ce"
 [[package]]
 name = "wasi"

{cotengrust-0.1.1 → cotengrust-0.1.3}/Cargo.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [package]
 name = "cotengrust"
-version = "0.1.1"
+version = "0.1.3"
 edition = "2021"
 # See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html
@@ -10,8 +10,8 @@ crate-type = ["cdylib"]
 [dependencies]
 bit-set = "0.5"
-pyo3 = "0.19"
-ordered-float = "3.9"
+ordered-float = "4.2"
+pyo3 = "0.21"
 rand = "0.8"
 rustc-hash = "1.1"

{cotengrust-0.1.1 → cotengrust-0.1.3}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
-Metadata-Version: 2.1
+Metadata-Version: 2.3
 Name: cotengrust
-Version: 0.1.1
+Version: 0.1.3
 Classifier: Programming Language :: Rust
 Classifier: Programming Language :: Python :: Implementation :: CPython
 Classifier: Programming Language :: Python :: Implementation :: PyPy
@@ -19,9 +19,14 @@ are:
 - `optimize_optimal(inputs, output, size_dict, **kwargs)`
 - `optimize_greedy(inputs, output, size_dict, **kwargs)`
-The optimal algorithm is an optimized version of the `opt_einsum` 'dp'
+The optimal algorithm is an optimized version of the `opt_einsum` 'dp'
 path - itself an implementation of https://arxiv.org/abs/1304.6112.
+There is also a variant of the greedy algorithm, which runs `ntrials` of greedy,
+randomized paths and computes and reports the flops cost (log10) simultaneously:
+- `optimize_random_greedy_track_flops(inputs, output, size_dict, **kwargs)`
 ## Installation
@@ -32,7 +37,7 @@ path - itself an implementation of https://arxiv.org/abs/1304.6112.
 pip install cotengrust
 ```
-or if you want to develop locally (which requires [pyo3](https://github.com/PyO3/pyo3)
+or if you want to develop locally (which requires [pyo3](https://github.com/PyO3/pyo3)
 and [maturin](https://github.com/PyO3/maturin)):
 ```bash
@@ -46,8 +51,8 @@ maturin develop --release
 ## Usage
 If `cotengrust` is installed, then by default `cotengra` will use it for its
-greedy and optimal subroutines, notably subtree reconfiguration. You can also
-call the routines directly:
+greedy, random-greedy, and optimal subroutines, notably subtree
+reconfiguration. You can also call the routines directly:
 ```python
 import cotengra as ctg
@@ -171,7 +176,7 @@ def optimize_greedy(
         When assessing local greedy scores how much to weight the size of the
         tensors removed compared to the size of the tensor added::
-            score = size_ab - costmod * (size_a + size_b)
+            score = size_ab / costmod - (size_a + size_b) * costmod
         This can be a useful hyper-parameter to tune.
     temperature : float, optional
@@ -237,6 +242,77 @@ def optimize_simplify(
     """
     ...
+def optimize_random_greedy_track_flops(
+    inputs,
+    output,
+    size_dict,
+    ntrials=1,
+    costmod=(0.1, 4.0),
+    temperature=(0.001, 1.0),
+    seed=None,
+    simplify=True,
+    use_ssa=False,
+):
+    """Perform a batch of random greedy optimizations, simultaneously tracking
+    the best contraction path in terms of flops, so as to avoid constructing a
+    separate contraction tree.
+    Parameters
+    ----------
+    inputs : tuple[tuple[str]]
+        The indices of each input tensor.
+    output : tuple[str]
+        The indices of the output tensor.
+    size_dict : dict[str, int]
+        A dictionary mapping indices to their dimension.
+    ntrials : int, optional
+        The number of random greedy trials to perform. The default is 1.
+    costmod : (float, float), optional
+        When assessing local greedy scores how much to weight the size of the
+        tensors removed compared to the size of the tensor added::
+            score = size_ab / costmod - (size_a + size_b) * costmod
+        It is sampled uniformly from the given range.
+    temperature : (float, float), optional
+        When assessing local greedy scores, how much to randomly perturb the
+        score. This is implemented as::
+            score -> sign(score) * log(|score|) - temperature * gumbel()
+        which implements boltzmann sampling. It is sampled log-uniformly from
+        the given range.
+    seed : int, optional
+        The seed for the random number generator.
+    simplify : bool, optional
+        Whether to perform simplifications before optimizing. These are:
+            - ignore any indices that appear in all terms
+            - combine any repeated indices within a single term
+            - reduce any non-output indices that only appear on a single term
+            - combine any scalar terms
+            - combine any tensors with matching indices (hadamard products)
+        Such simplifications may be required in the general case for the proper
+        functioning of the core optimization, but may be skipped if the input
+        indices are already in a simplified form.
+    use_ssa : bool, optional
+        Whether to return the contraction path in 'single static assignment'
+        (SSA) format (i.e. as if each intermediate is appended to the list of
+        inputs, without removals). This can be quicker and easier to work with
+        than the 'linear recycled' format that `numpy` and `opt_einsum` use.
+    Returns
+    -------
+    path : list[list[int]]
+        The best contraction path, given as a sequence of pairs of node
+        indices.
+    flops : float
+        The flops (/ contraction cost / number of multiplications), of the best
+        contraction path, given log10.
+    """
+    ...
 def ssa_to_linear(ssa_path, n=None):
     """Convert a SSA path to linear format."""
     ...

{cotengrust-0.1.1 → cotengrust-0.1.3}/README.md RENAMED Viewed

@@ -7,9 +7,14 @@ are:
 - `optimize_optimal(inputs, output, size_dict, **kwargs)`
 - `optimize_greedy(inputs, output, size_dict, **kwargs)`
-The optimal algorithm is an optimized version of the `opt_einsum` 'dp'
+The optimal algorithm is an optimized version of the `opt_einsum` 'dp'
 path - itself an implementation of https://arxiv.org/abs/1304.6112.
+There is also a variant of the greedy algorithm, which runs `ntrials` of greedy,
+randomized paths and computes and reports the flops cost (log10) simultaneously:
+- `optimize_random_greedy_track_flops(inputs, output, size_dict, **kwargs)`
 ## Installation
@@ -20,7 +25,7 @@ path - itself an implementation of https://arxiv.org/abs/1304.6112.
 pip install cotengrust
 ```
-or if you want to develop locally (which requires [pyo3](https://github.com/PyO3/pyo3)
+or if you want to develop locally (which requires [pyo3](https://github.com/PyO3/pyo3)
 and [maturin](https://github.com/PyO3/maturin)):
 ```bash
@@ -34,8 +39,8 @@ maturin develop --release
 ## Usage
 If `cotengrust` is installed, then by default `cotengra` will use it for its
-greedy and optimal subroutines, notably subtree reconfiguration. You can also
-call the routines directly:
+greedy, random-greedy, and optimal subroutines, notably subtree
+reconfiguration. You can also call the routines directly:
 ```python
 import cotengra as ctg
@@ -159,7 +164,7 @@ def optimize_greedy(
         When assessing local greedy scores how much to weight the size of the
         tensors removed compared to the size of the tensor added::
-            score = size_ab - costmod * (size_a + size_b)
+            score = size_ab / costmod - (size_a + size_b) * costmod
         This can be a useful hyper-parameter to tune.
     temperature : float, optional
@@ -225,6 +230,77 @@ def optimize_simplify(
     """
     ...
+def optimize_random_greedy_track_flops(
+    inputs,
+    output,
+    size_dict,
+    ntrials=1,
+    costmod=(0.1, 4.0),
+    temperature=(0.001, 1.0),
+    seed=None,
+    simplify=True,
+    use_ssa=False,
+):
+    """Perform a batch of random greedy optimizations, simultaneously tracking
+    the best contraction path in terms of flops, so as to avoid constructing a
+    separate contraction tree.
+    Parameters
+    ----------
+    inputs : tuple[tuple[str]]
+        The indices of each input tensor.
+    output : tuple[str]
+        The indices of the output tensor.
+    size_dict : dict[str, int]
+        A dictionary mapping indices to their dimension.
+    ntrials : int, optional
+        The number of random greedy trials to perform. The default is 1.
+    costmod : (float, float), optional
+        When assessing local greedy scores how much to weight the size of the
+        tensors removed compared to the size of the tensor added::
+            score = size_ab / costmod - (size_a + size_b) * costmod
+        It is sampled uniformly from the given range.
+    temperature : (float, float), optional
+        When assessing local greedy scores, how much to randomly perturb the
+        score. This is implemented as::
+            score -> sign(score) * log(|score|) - temperature * gumbel()
+        which implements boltzmann sampling. It is sampled log-uniformly from
+        the given range.
+    seed : int, optional
+        The seed for the random number generator.
+    simplify : bool, optional
+        Whether to perform simplifications before optimizing. These are:
+            - ignore any indices that appear in all terms
+            - combine any repeated indices within a single term
+            - reduce any non-output indices that only appear on a single term
+            - combine any scalar terms
+            - combine any tensors with matching indices (hadamard products)
+        Such simplifications may be required in the general case for the proper
+        functioning of the core optimization, but may be skipped if the input
+        indices are already in a simplified form.
+    use_ssa : bool, optional
+        Whether to return the contraction path in 'single static assignment'
+        (SSA) format (i.e. as if each intermediate is appended to the list of
+        inputs, without removals). This can be quicker and easier to work with
+        than the 'linear recycled' format that `numpy` and `opt_einsum` use.
+    Returns
+    -------
+    path : list[list[int]]
+        The best contraction path, given as a sequence of pairs of node
+        indices.
+    flops : float
+        The flops (/ contraction cost / number of multiplications), of the best
+        contraction path, given log10.
+    """
+    ...
 def ssa_to_linear(ssa_path, n=None):
     """Convert a SSA path to linear format."""
     ...

{cotengrust-0.1.1 → cotengrust-0.1.3}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "cotengrust"
-version = "0.1.1"
+version = "0.1.3"
 description = "Fast contraction ordering primitives for tensor networks."
 readme = "README.md"
 requires-python = ">=3.8"
@@ -15,7 +15,7 @@ authors = [
 ]
 [build-system]
-requires = ["maturin>=0.15,<0.16"]
+requires = ["maturin>=1.0,<2.0"]
 build-backend = "maturin"
 [tool.maturin]

{cotengrust-0.1.1 → cotengrust-0.1.3}/src/lib.rs RENAMED Viewed

@@ -2,8 +2,9 @@ use bit_set::BitSet;
 use ordered_float::OrderedFloat;
 use pyo3::prelude::*;
 use rand::Rng;
+use rand::SeedableRng;
 use rustc_hash::FxHashMap;
-use std::collections::{BTreeSet, BinaryHeap};
+use std::collections::{BTreeSet, BinaryHeap, HashSet};
 use std::f32;
 use FxHashMap as Dict;
@@ -23,6 +24,7 @@ type BitPath = Vec<(Subgraph, Subgraph)>;
 type SubContraction = (Legs, Score, BitPath);
 /// helper struct to build contractions from bottom up
+#[derive(Clone)]
 struct ContractionProcessor {
     nodes: Dict<Node, Legs>,
     edges: Dict<Ix, BTreeSet<Node>>,
@@ -30,6 +32,9 @@ struct ContractionProcessor {
     sizes: Vec<Score>,
     ssa: Node,
     ssa_path: SSAPath,
+    track_flops: bool,
+    flops: Score,
+    flops_limit: Score,
 }
 /// given log(x) and log(y) compute log(x + y), without exponentiating both
@@ -94,6 +99,21 @@ fn compute_size(legs: &Legs, sizes: &Vec<Score>) -> Score {
     legs.iter().map(|&(ix, _)| sizes[ix as usize]).sum()
 }
+fn compute_flops(ilegs: &Legs, jlegs: &Legs, sizes: &Vec<Score>) -> Score {
+    let mut flops: Score = 0.0;
+    let mut seen: HashSet<Ix> = HashSet::with_capacity(ilegs.len());
+    for &(ix, _) in ilegs {
+        seen.insert(ix);
+        flops += sizes[ix as usize];
+    }
+    for (ix, _) in jlegs {
+        if !seen.contains(ix) {
+            flops += sizes[*ix as usize];
+        }
+    }
+    flops
+}
 fn is_simplifiable(legs: &Legs, appearances: &Vec<Count>) -> bool {
     let mut prev_ix = Node::MAX;
     for &(ix, ix_count) in legs {
@@ -131,7 +151,12 @@ impl ContractionProcessor {
         inputs: Vec<Vec<char>>,
         output: Vec<char>,
         size_dict: Dict<char, f32>,
+        track_flops: bool,
     ) -> ContractionProcessor {
+        if size_dict.len() > Ix::MAX as usize {
+            panic!("cotengrust: too many indices, maximum is {}", Ix::MAX);
+        }
         let mut nodes: Dict<Node, Legs> = Dict::default();
         let mut edges: Dict<Ix, BTreeSet<Node>> = Dict::default();
         let mut indmap: Dict<char, Ix> = Dict::default();
@@ -149,7 +174,7 @@ impl ContractionProcessor {
                         indmap.insert(ind, c);
                         edges.insert(c, std::iter::once(i as Node).collect());
                         appearances.push(1);
-                        sizes.push(f32::log(size_dict[&ind] as f32, 2.0));
+                        sizes.push(f32::ln(size_dict[&ind] as f32));
                         legs.push((c, 1));
                         c += 1;
                     }
@@ -170,6 +195,8 @@ impl ContractionProcessor {
         let ssa = nodes.len() as Node;
         let ssa_path: SSAPath = Vec::with_capacity(2 * ssa as usize - 1);
+        let flops: Score = 0.0;
+        let flops_limit: Score = Score::INFINITY;
         ContractionProcessor {
             nodes,
@@ -178,6 +205,9 @@ impl ContractionProcessor {
             sizes,
             ssa,
             ssa_path,
+            track_flops,
+            flops,
+            flops_limit,
         }
     }
@@ -225,7 +255,9 @@ impl ContractionProcessor {
         for (ix, _) in &legs {
             self.edges
                 .entry(*ix)
-                .and_modify(|nodes| {nodes.insert(i);})
+                .and_modify(|nodes| {
+                    nodes.insert(i);
+                })
                 .or_insert(std::iter::once(i as Node).collect());
         }
         self.nodes.insert(i, legs);
@@ -236,12 +268,27 @@ impl ContractionProcessor {
     fn contract_nodes(&mut self, i: Node, j: Node) -> Node {
         let ilegs = self.pop_node(i);
         let jlegs = self.pop_node(j);
+        if self.track_flops {
+            self.flops = logadd(self.flops, compute_flops(&ilegs, &jlegs, &self.sizes));
+        }
         let new_legs = compute_legs(&ilegs, &jlegs, &self.appearances);
         let k = self.add_node(new_legs);
         self.ssa_path.push(vec![i, j]);
         k
     }
+    /// contract two nodes (which we already know the legs for), return the new node id
+    fn contract_nodes_given_legs(&mut self, i: Node, j: Node, new_legs: Legs) -> Node {
+        let ilegs = self.pop_node(i);
+        let jlegs = self.pop_node(j);
+        if self.track_flops {
+            self.flops = logadd(self.flops, compute_flops(&ilegs, &jlegs, &self.sizes));
+        }
+        let k = self.add_node(new_legs);
+        self.ssa_path.push(vec![i, j]);
+        k
+    }
     /// find any indices that appear in all terms and just remove/ignore them
     fn simplify_batch(&mut self) {
         let mut ix_to_remove = Vec::new();
@@ -366,18 +413,32 @@ impl ContractionProcessor {
     }
     /// greedily optimize the contraction order of all terms
-    fn optimize_greedy(&mut self, costmod: Option<f32>, temperature: Option<f32>) {
-        let mut rng = rand::thread_rng();
+    fn optimize_greedy(
+        &mut self,
+        costmod: Option<f32>,
+        temperature: Option<f32>,
+        seed: Option<u64>,
+    ) -> bool {
         let coeff_t = temperature.unwrap_or(0.0);
         let log_coeff_a = f32::ln(costmod.unwrap_or(1.0));
+        let mut rng = if coeff_t != 0.0 {
+            Some(match seed {
+                Some(seed) => rand::rngs::StdRng::seed_from_u64(seed),
+                None => rand::rngs::StdRng::from_entropy(),
+            })
+        } else {
+            // zero temp - no need for rng
+            None
+        };
         let mut local_score = |sa: Score, sb: Score, sab: Score| -> Score {
-            let gumbel = if coeff_t != 0.0 {
+            let gumbel = if let Some(rng) = &mut rng {
                 coeff_t * -f32::ln(-f32::ln(rng.gen()))
             } else {
                 0.0 as f32
             };
-            logsub(sab, log_coeff_a + logadd(sa, sb)) - gumbel
+            logsub(sab - log_coeff_a, logadd(sa, sb) + log_coeff_a) - gumbel
         };
         // cache all current nodes sizes as we go
@@ -424,11 +485,13 @@ impl ContractionProcessor {
             }
             // perform contraction:
-            // we already have the legs, so don't call contract_nodes
-            self.pop_node(i);
-            self.pop_node(j);
-            let k = self.add_node(klegs.clone());
-            self.ssa_path.push(vec![i, j]);
+            let k = self.contract_nodes_given_legs(i, j, klegs.clone());
+            if self.track_flops && self.flops >= self.flops_limit {
+                // stop if we have reached the flops limit
+                return false;
+            }
             node_sizes.insert(k, ksize);
             for l in self.neighbors(k) {
@@ -444,6 +507,8 @@ impl ContractionProcessor {
                 c -= 1;
             }
         }
+        // success
+        return true;
     }
     /// Optimize the contraction order of all terms using a greedy algorithm
@@ -800,7 +865,6 @@ impl ContractionProcessor {
 // --------------------------- PYTHON FUNCTIONS ---------------------------- //
 #[pyfunction]
-#[pyo3()]
 fn ssa_to_linear(ssa_path: SSAPath, n: Option<usize>) -> SSAPath {
     let n = match n {
         Some(n) => n,
@@ -828,18 +892,16 @@ fn ssa_to_linear(ssa_path: SSAPath, n: Option<usize>) -> SSAPath {
 }
 #[pyfunction]
-#[pyo3()]
 fn find_subgraphs(
     inputs: Vec<Vec<char>>,
     output: Vec<char>,
     size_dict: Dict<char, f32>,
 ) -> Vec<Vec<Node>> {
-    let cp = ContractionProcessor::new(inputs, output, size_dict);
+    let cp = ContractionProcessor::new(inputs, output, size_dict, false);
     cp.subgraphs()
 }
 #[pyfunction]
-#[pyo3()]
 fn optimize_simplify(
     inputs: Vec<Vec<char>>,
     output: Vec<char>,
@@ -847,7 +909,7 @@ fn optimize_simplify(
     use_ssa: Option<bool>,
 ) -> SSAPath {
     let n = inputs.len();
-    let mut cp = ContractionProcessor::new(inputs, output, size_dict);
+    let mut cp = ContractionProcessor::new(inputs, output, size_dict, false);
     cp.simplify();
     if use_ssa.unwrap_or(false) {
         cp.ssa_path
@@ -857,36 +919,124 @@ fn optimize_simplify(
 }
 #[pyfunction]
-#[pyo3()]
 fn optimize_greedy(
+    py: Python,
     inputs: Vec<Vec<char>>,
     output: Vec<char>,
     size_dict: Dict<char, f32>,
     costmod: Option<f32>,
     temperature: Option<f32>,
+    seed: Option<u64>,
     simplify: Option<bool>,
     use_ssa: Option<bool>,
 ) -> Vec<Vec<Node>> {
-    let n = inputs.len();
-    let mut cp = ContractionProcessor::new(inputs, output, size_dict);
-    if simplify.unwrap_or(true) {
-        // perform simplifications
-        cp.simplify();
-    }
-    // greddily contract each connected subgraph
-    cp.optimize_greedy(costmod, temperature);
-    // optimize any remaining disconnected terms
-    cp.optimize_remaining_by_size();
-    if use_ssa.unwrap_or(false) {
-        cp.ssa_path
-    } else {
-        ssa_to_linear(cp.ssa_path, Some(n))
-    }
+    py.allow_threads(|| {
+        let n = inputs.len();
+        let mut cp = ContractionProcessor::new(inputs, output, size_dict, false);
+        if simplify.unwrap_or(true) {
+            // perform simplifications
+            cp.simplify();
+        }
+        // greedily contract each connected subgraph
+        cp.optimize_greedy(costmod, temperature, seed);
+        // optimize any remaining disconnected terms
+        cp.optimize_remaining_by_size();
+        if use_ssa.unwrap_or(false) {
+            cp.ssa_path
+        } else {
+            ssa_to_linear(cp.ssa_path, Some(n))
+        }
+    })
+}
+#[pyfunction]
+fn optimize_random_greedy_track_flops(
+    py: Python,
+    inputs: Vec<Vec<char>>,
+    output: Vec<char>,
+    size_dict: Dict<char, f32>,
+    ntrials: usize,
+    costmod: Option<(f32, f32)>,
+    temperature: Option<(f32, f32)>,
+    seed: Option<u64>,
+    simplify: Option<bool>,
+    use_ssa: Option<bool>,
+) -> (Vec<Vec<Node>>, Score) {
+    py.allow_threads(|| {
+        let (costmod_min, costmod_max) = costmod.unwrap_or((0.1, 4.0));
+        let costmod_diff = (costmod_max - costmod_min).abs();
+        let is_const_costmod = costmod_diff < Score::EPSILON;
+        let (temp_min, temp_max) = temperature.unwrap_or((0.001, 1.0));
+        let log_temp_min = Score::ln(temp_min);
+        let log_temp_max = Score::ln(temp_max);
+        let log_temp_diff = (log_temp_max - log_temp_min).abs();
+        let is_const_temp = log_temp_diff < Score::EPSILON;
+        let mut rng = match seed {
+            Some(seed) => rand::rngs::StdRng::seed_from_u64(seed),
+            None => rand::rngs::StdRng::from_entropy(),
+        };
+        let seeds = (0..ntrials).map(|_| rng.gen()).collect::<Vec<u64>>();
+        let n: usize = inputs.len();
+        // construct processor and perform simplifications once
+        let mut cp0 = ContractionProcessor::new(inputs, output, size_dict, true);
+        if simplify.unwrap_or(true) {
+            cp0.simplify();
+        }
+        let mut best_path = None;
+        let mut best_flops = f32::INFINITY;
+        for seed in seeds {
+            let mut cp = cp0.clone();
+            // uniform sample for costmod
+            let costmod = if is_const_costmod {
+                costmod_min
+            } else {
+                costmod_min + rng.gen::<f32>() * costmod_diff
+            };
+            // log-uniform sample for temperature
+            let temperature = if is_const_temp {
+                temp_min
+            } else {
+                f32::exp(log_temp_min + rng.gen::<f32>() * log_temp_diff)
+            };
+            // greedily contract each connected subgraph
+            let success = cp.optimize_greedy(Some(costmod), Some(temperature), Some(seed));
+            if !success {
+                continue;
+            }
+            // optimize any remaining disconnected terms
+            cp.optimize_remaining_by_size();
+            if cp.flops < best_flops {
+                best_path = Some(cp.ssa_path);
+                best_flops = cp.flops;
+                cp0.flops_limit = cp.flops;
+            }
+        }
+        // convert to base 10 for easier comparison
+        best_flops *= f32::consts::LOG10_E;
+        if use_ssa.unwrap_or(false) {
+            (best_path.unwrap(), best_flops)
+        } else {
+            (ssa_to_linear(best_path.unwrap(), Some(n)), best_flops)
+        }
+    })
 }
 #[pyfunction]
-#[pyo3()]
 fn optimize_optimal(
+    py: Python,
     inputs: Vec<Vec<char>>,
     output: Vec<char>,
     size_dict: Dict<char, f32>,
@@ -896,30 +1046,33 @@ fn optimize_optimal(
     simplify: Option<bool>,
     use_ssa: Option<bool>,
 ) -> Vec<Vec<Node>> {
-    let n = inputs.len();
-    let mut cp = ContractionProcessor::new(inputs, output, size_dict);
-    if simplify.unwrap_or(true) {
-        // perform simplifications
-        cp.simplify();
-    }
-    // optimally contract each connected subgraph
-    cp.optimize_optimal(minimize, cost_cap, search_outer);
-    // optimize any remaining disconnected terms
-    cp.optimize_remaining_by_size();
-    if use_ssa.unwrap_or(false) {
-        cp.ssa_path
-    } else {
-        ssa_to_linear(cp.ssa_path, Some(n))
-    }
+    py.allow_threads(|| {
+        let n = inputs.len();
+        let mut cp = ContractionProcessor::new(inputs, output, size_dict, false);
+        if simplify.unwrap_or(true) {
+            // perform simplifications
+            cp.simplify();
+        }
+        // optimally contract each connected subgraph
+        cp.optimize_optimal(minimize, cost_cap, search_outer);
+        // optimize any remaining disconnected terms
+        cp.optimize_remaining_by_size();
+        if use_ssa.unwrap_or(false) {
+            cp.ssa_path
+        } else {
+            ssa_to_linear(cp.ssa_path, Some(n))
+        }
+    })
 }
 /// A Python module implemented in Rust.
 #[pymodule]
-fn cotengrust(_py: Python, m: &PyModule) -> PyResult<()> {
+fn cotengrust(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_function(wrap_pyfunction!(ssa_to_linear, m)?)?;
     m.add_function(wrap_pyfunction!(find_subgraphs, m)?)?;
     m.add_function(wrap_pyfunction!(optimize_simplify, m)?)?;
     m.add_function(wrap_pyfunction!(optimize_greedy, m)?)?;
+    m.add_function(wrap_pyfunction!(optimize_random_greedy_track_flops, m)?)?;
     m.add_function(wrap_pyfunction!(optimize_optimal, m)?)?;
     Ok(())
 }

{cotengrust-0.1.1 → cotengrust-0.1.3}/tests/test_cotengrust.py RENAMED Viewed

@@ -56,6 +56,15 @@ def get_rand_size_dict(inputs, d_min=2, d_max=3):
 # these are taken from opt_einsum
 test_case_eqs = [
+    # Test single-term equations
+    "->",
+    "a->a",
+    "ab->ab",
+    "ab->ba",
+    "abc->bca",
+    "abc->b",
+    "baa->ba",
+    "aba->b",
     # Test scalar-like operations
     "a,->a",
     "ab,->ab",
@@ -188,18 +197,39 @@ def test_basic_rand(seed, which):
 @requires_cotengra
 def test_optimal_lattice_eq():
     inputs, output, _, size_dict = ctg.utils.lattice_equation(
-        [4, 5], d_max=3, seed=42
+        [4, 5], d_max=2, seed=42
     )
     path = ctgr.optimize_optimal(inputs, output, size_dict, minimize='flops')
     tree = ctg.ContractionTree.from_path(
         inputs, output, size_dict, path=path
     )
-    assert tree.contraction_cost() == 3628
+    assert tree.is_complete()
+    assert tree.contraction_cost() == 964
     path = ctgr.optimize_optimal(inputs, output, size_dict, minimize='size')
     assert all(len(con) <= 2 for con in path)
     tree = ctg.ContractionTree.from_path(
         inputs, output, size_dict, path=path
     )
-    assert tree.contraction_width() == pytest.approx(6.754887502163468)
+    assert tree.contraction_width() == pytest.approx(5)
+@requires_cotengra
+def test_optimize_random_greedy_log_flops():
+    inputs, output, _, size_dict = ctg.utils.lattice_equation(
+        [10, 10], d_max=3, seed=42
+    )
+    path, cost1 = ctgr.optimize_random_greedy_track_flops(
+        inputs, output, size_dict, ntrials=4, seed=42
+    )
+    _, cost2 = ctgr.optimize_random_greedy_track_flops(
+        inputs, output, size_dict, ntrials=4, seed=42
+    )
+    assert cost1 == cost2
+    tree = ctg.ContractionTree.from_path(
+        inputs, output, size_dict, path=path
+    )
+    assert tree.is_complete()
+    assert tree.contraction_cost(log=10) == pytest.approx(cost1)

cotengrust-0.1.1/.github/workflows/CI.yml DELETED Viewed

@@ -1,162 +0,0 @@
-# This file is autogenerated by maturin v1.2.3
-# To update, run
-#
-#    maturin generate-ci github --pytest
-#
-name: CI
-on:
-  push:
-    branches:
-      - main
-      - master
-    tags:
-      - '*'
-  pull_request:
-  workflow_dispatch:
-permissions:
-  contents: read
-jobs:
-  linux:
-    runs-on: ubuntu-latest
-    strategy:
-      matrix:
-        target: [x86_64, x86, aarch64, armv7, s390x, ppc64le]
-    steps:
-      - uses: actions/checkout@v3
-      - uses: actions/setup-python@v4
-        with:
-          python-version: '3.10'
-      - name: Build wheels
-        uses: PyO3/maturin-action@v1
-        with:
-          target: ${{ matrix.target }}
-          args: --release --out dist --find-interpreter
-          sccache: 'true'
-          manylinux: auto
-      - name: Upload wheels
-        uses: actions/upload-artifact@v3
-        with:
-          name: wheels
-          path: dist
-      - name: pytest
-        if: ${{ startsWith(matrix.target, 'x86_64') }}
-        shell: bash
-        run: |
-          set -e
-          ls dist/*
-          pip install cotengrust --find-links dist --force-reinstall
-          pip install pytest numpy cotengra
-          pytest --verbose
-      - name: pytest
-        if: ${{ !startsWith(matrix.target, 'x86') && matrix.target != 'ppc64' }}
-        uses: uraimo/run-on-arch-action@v2.5.0
-        with:
-          arch: ${{ matrix.target }}
-          distro: ubuntu22.04
-          githubToken: ${{ github.token }}
-          install: |
-            apt-get update
-            apt-get install -y --no-install-recommends python3 python3-pip
-            pip3 install -U pip pytest # numpy cotengra
-          run: |
-            set -e
-            pip3 install cotengrust --find-links dist --force-reinstall
-            pytest --verbose
-  windows:
-    runs-on: windows-latest
-    strategy:
-      matrix:
-        target: [x64, x86]
-    steps:
-      - uses: actions/checkout@v3
-      - uses: actions/setup-python@v4
-        with:
-          python-version: '3.10'
-          architecture: ${{ matrix.target }}
-      - name: Build wheels
-        uses: PyO3/maturin-action@v1
-        with:
-          target: ${{ matrix.target }}
-          args: --release --out dist --find-interpreter
-          sccache: 'true'
-      - name: Upload wheels
-        uses: actions/upload-artifact@v3
-        with:
-          name: wheels
-          path: dist
-      - name: pytest
-        if: ${{ !startsWith(matrix.target, 'aarch64') }}
-        shell: bash
-        run: |
-          set -e
-          ls dist/*
-          pip install cotengrust --find-links dist --force-reinstall
-          pip install pytest numpy cotengra
-          pytest --verbose
-  macos:
-    runs-on: macos-latest
-    strategy:
-      matrix:
-        target: [x86_64, aarch64]
-    steps:
-      - uses: actions/checkout@v3
-      - uses: actions/setup-python@v4
-        with:
-          python-version: '3.10'
-      - name: Build wheels
-        uses: PyO3/maturin-action@v1
-        with:
-          target: ${{ matrix.target }}
-          args: --release --out dist --find-interpreter
-          sccache: 'true'
-      - name: Upload wheels
-        uses: actions/upload-artifact@v3
-        with:
-          name: wheels
-          path: dist
-      - name: pytest
-        if: ${{ !startsWith(matrix.target, 'aarch64') }}
-        shell: bash
-        run: |
-          set -e
-          ls dist/*
-          pip install cotengrust --find-links dist --force-reinstall
-          pip install pytest numpy cotengra
-          pytest --verbose
-  sdist:
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v3
-      - name: Build sdist
-        uses: PyO3/maturin-action@v1
-        with:
-          command: sdist
-          args: --out dist
-      - name: Upload sdist
-        uses: actions/upload-artifact@v3
-        with:
-          name: wheels
-          path: dist
-  release:
-    name: Release
-    runs-on: ubuntu-latest
-    if: startsWith(github.ref, 'refs/tags/')
-    needs: [linux, windows, macos, sdist]
-    steps:
-      - uses: actions/download-artifact@v3
-        with:
-          name: wheels
-      - name: Publish to PyPI
-        uses: PyO3/maturin-action@v1
-        env:
-          MATURIN_PYPI_TOKEN: ${{ secrets.PYPI_API_TOKEN }}
-        with:
-          command: upload
-          args: --non-interactive --skip-existing *

{cotengrust-0.1.1 → cotengrust-0.1.3}/.gitignore RENAMED Viewed

File without changes

{cotengrust-0.1.1 → cotengrust-0.1.3}/LICENSE RENAMED Viewed

File without changes

cotengrust 0.1.1__tar.gz → 0.1.3__tar.gz

cotengrust 0.1.1tar.gz → 0.1.3tar.gz