mdot-tnt 0.1.0__py3-none-any.whl → 1.0.0__py3-none-any.whl
This diff shows the changes between publicly released versions of the package as they appear in their respective public registries; it is provided for informational purposes only.
- mdot_tnt/__init__.py +52 -8
- mdot_tnt/batched.py +634 -0
- mdot_tnt/mdot.py +105 -41
- mdot_tnt/py.typed +0 -0
- mdot_tnt/rounding.py +41 -15
- mdot_tnt/truncated_newton.py +107 -38
- mdot_tnt-1.0.0.dist-info/METADATA +216 -0
- mdot_tnt-1.0.0.dist-info/RECORD +11 -0
- {mdot_tnt-0.1.0.dist-info → mdot_tnt-1.0.0.dist-info}/WHEEL +1 -1
- {mdot_tnt-0.1.0.dist-info → mdot_tnt-1.0.0.dist-info/licenses}/LICENSE +4 -1
- mdot_tnt-0.1.0.dist-info/METADATA +0 -71
- mdot_tnt-0.1.0.dist-info/RECORD +0 -9
- {mdot_tnt-0.1.0.dist-info → mdot_tnt-1.0.0.dist-info}/top_level.txt +0 -0
mdot_tnt/__init__.py CHANGED

@@ -1,11 +1,48 @@
+"""
+MDOT-TNT: A Truncated Newton Method for Optimal Transport
+
+This package provides efficient solvers for the entropic-regularized optimal transport
+problem, as introduced in the paper "A Truncated Newton Method for Optimal Transport"
+by Mete Kemertas, Amir-massoud Farahmand, Allan D. Jepson (ICLR, 2025).
+URL: https://openreview.net/forum?id=gWrWUaCbMa
+
+Main functions:
+    solve_OT: Solve a single OT problem.
+    solve_OT_batched: Solve multiple OT problems simultaneously (5-10x faster).
+
+Example:
+    >>> import torch
+    >>> from mdot_tnt import solve_OT, solve_OT_batched
+    >>>
+    >>> # Single problem
+    >>> r = torch.rand(512, device='cuda', dtype=torch.float64)
+    >>> r = r / r.sum()
+    >>> c = torch.rand(512, device='cuda', dtype=torch.float64)
+    >>> c = c / c.sum()
+    >>> C = torch.rand(512, 512, device='cuda', dtype=torch.float64)
+    >>> cost = solve_OT(r, c, C, gamma_f=1024.)
+    >>>
+    >>> # Batched (32 problems at once)
+    >>> r_batch = torch.rand(32, 512, device='cuda', dtype=torch.float64)
+    >>> r_batch = r_batch / r_batch.sum(-1, keepdim=True)
+    >>> c_batch = torch.rand(32, 512, device='cuda', dtype=torch.float64)
+    >>> c_batch = c_batch / c_batch.sum(-1, keepdim=True)
+    >>> costs = solve_OT_batched(r_batch, c_batch, C, gamma_f=1024.)
+"""
+
+import math
+import warnings
 
 import torch as th
 
-from mdot_tnt.
+from mdot_tnt.batched import solve_OT_batched
+from mdot_tnt.mdot import mdot, preprocess_marginals
 from mdot_tnt.rounding import round_altschuler, rounded_cost_altschuler
 
+__all__ = ["solve_OT", "solve_OT_batched"]
+
 
-def solve_OT(r, c, C, gamma_f=
+def solve_OT(r, c, C, gamma_f=1024.0, drop_tiny=False, return_plan=False, round=True, log=False):
     """
     Solve the entropic-regularized optimal transport problem. Inputs r, c, C are required to be torch tensors.
     :param r: n-dimensional row marginal.
@@ -23,21 +60,28 @@ def solve_OT(r, c, C, gamma_f=4096., drop_tiny=False, return_plan=False, round=T
     """
     assert all(isinstance(x, th.Tensor) for x in [r, c, C]), "r, c, and C must be torch tensors"
     dtype = r.dtype
-
+    # Require high precision for gamma_f > 2^10
+    if gamma_f > 2**10 and dtype != th.float64:
+        warnings.warn(
+            "Switching to double precision for gamma_f > 2^10 during execution. "
+            f"Output will be input dtype: {dtype}."
+        )
     r, c, C = r.double(), c.double(), C.double()
+
     if drop_tiny:
-        drop_lessthan = math.log(min(r.size(-1), c.size(-1))) / (gamma_f
+        drop_lessthan = math.log(min(r.size(-1), c.size(-1))) / (gamma_f**2)
         (r_, r_keep), (c_, c_keep), C_ = preprocess_marginals(r, c, C, drop_lessthan)
 
         u_, v_, gamma_f_, k_total, opt_logs = mdot(r_, c_, C_, gamma_f)
 
-        u = -th.ones_like(r) * float(
-        u[
-        v = -th.ones_like(c) * float(
-        v[
+        u = -th.ones_like(r) * float("inf")
+        u[r_keep] = u_
+        v = -th.ones_like(c) * float("inf")
+        v[c_keep] = v_
     else:
         u, v, gamma_f_, k_total, opt_logs = mdot(r, c, C, gamma_f)
 
+    # Switch back to original dtype
     u, v = u.to(dtype), v.to(dtype)
 
     if return_plan:
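
For readers who want to try the new 1.0.0 entry points outside of the docstring, the sketch below exercises the API shown in the diff above. It is a minimal sketch based only on the signatures and docstring visible here; it assumes the solvers also accept CPU tensors (the docstring example uses CUDA) and that, as in the docstring example, `solve_OT_batched` can share a single cost matrix C across the batch.

    import math
    import torch

    from mdot_tnt import solve_OT, solve_OT_batched

    n, batch = 512, 32

    # Single problem: marginals are normalized probability vectors.
    r = torch.rand(n, dtype=torch.float64)
    r = r / r.sum()
    c = torch.rand(n, dtype=torch.float64)
    c = c / c.sum()
    C = torch.rand(n, n, dtype=torch.float64)

    # gamma_f now defaults to 1024.0 (it was 4096. in 0.1.0).
    cost = solve_OT(r, c, C, gamma_f=1024.0)

    # drop_tiny=True discards marginal entries below log(min(n, m)) / gamma_f**2
    # before solving and pins their dual potentials to -inf afterwards;
    # for n = 512 and gamma_f = 1024 the threshold is roughly 5.9e-6.
    print(math.log(n) / 1024.0**2)
    cost_sparse = solve_OT(r, c, C, gamma_f=1024.0, drop_tiny=True)

    # With gamma_f > 2**10 and non-float64 inputs, 1.0.0 warns that it switches
    # to double precision internally and returns output in the input dtype.
    cost32 = solve_OT(r.float(), c.float(), C.float(), gamma_f=2048.0)

    # Batched: 32 problems solved at once against a shared cost matrix.
    r_b = torch.rand(batch, n, dtype=torch.float64)
    r_b = r_b / r_b.sum(-1, keepdim=True)
    c_b = torch.rand(batch, n, dtype=torch.float64)
    c_b = c_b / c_b.sum(-1, keepdim=True)
    costs = solve_OT_batched(r_b, c_b, C, gamma_f=1024.0)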
|