torchax 0.0.4__py3-none-any.whl → 0.0.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of torchax was flagged as potentially problematic by the registry.
- torchax/CONTRIBUTING.md +2 -2
- torchax/__init__.py +26 -24
- torchax/amp.py +332 -0
- torchax/config.py +25 -14
- torchax/configuration.py +30 -0
- torchax/decompositions.py +663 -195
- torchax/device_module.py +14 -1
- torchax/environment.py +0 -1
- torchax/export.py +26 -17
- torchax/flax.py +39 -0
- torchax/interop.py +288 -141
- torchax/mesh_util.py +220 -0
- torchax/ops/jaten.py +1723 -1297
- torchax/ops/jax_reimplement.py +23 -21
- torchax/ops/jc10d.py +5 -4
- torchax/ops/jimage.py +113 -0
- torchax/ops/jlibrary.py +9 -2
- torchax/ops/jtorch.py +237 -88
- torchax/ops/jtorchvision_nms.py +32 -43
- torchax/ops/mappings.py +77 -35
- torchax/ops/op_base.py +59 -32
- torchax/ops/ops_registry.py +40 -35
- torchax/tensor.py +442 -288
- torchax/train.py +38 -41
- torchax/util.py +88 -0
- torchax/view.py +377 -0
- {torchax-0.0.4.dist-info → torchax-0.0.6.dist-info}/METADATA +111 -145
- torchax-0.0.6.dist-info/RECORD +33 -0
- torchax/distributed.py +0 -246
- torchax-0.0.4.dist-info/RECORD +0 -27
- {torchax-0.0.4.dist-info → torchax-0.0.6.dist-info}/WHEEL +0 -0
- {torchax-0.0.4.dist-info → torchax-0.0.6.dist-info}/licenses/LICENSE +0 -0
torchax/tensor.py
CHANGED
@@ -1,3 +1,4 @@
+import threading
 import logging
 import sys
 import contextlib
@@ -5,15 +6,17 @@ from typing import Optional, Any
 import jax
 import jax.numpy as jnp
 import numpy
+import itertools
 import torch
 import torch.distributed._functional_collectives
 import torch.func
 import torch.utils._mode_utils as mode_utils
 import torch.utils._python_dispatch as torch_dispatch
 import torch.utils._pytree as torch_pytree
-
+from torchax.view import View
 from torchax import config
 from torchax.ops import mappings, ops_registry
+from torchax import amp

 logger = logging.getLogger(__name__)

@@ -22,63 +25,42 @@ class OperatorNotFound(Exception):
   pass


-def wrap(jaxarray):
-  return torch_pytree.tree_map_only(jnp.ndarray, Tensor, jaxarray)
-
-
-def unwrap(torchtensors):
-  return torch_pytree.tree_map_only(Tensor, lambda x: x._elem, torchtensors)
-
-
-def t2j(t):
-  if isinstance(t, Tensor):
-    return t._elem
-  return mappings.t2j(t)
-
-
-def j2t(x):
-  return mappings.j2t(x)
-
-
-def t2j_dtype(dtype):
-  return mappings.t2j_dtype(dtype)
-
-
-def j2t_dtype(dtype):
-  return mappings.j2t_dtype(dtype)
-
-
 @contextlib.contextmanager
 def log_nested(env, message):
   if env.config.debug_print_each_op:
-    print((
+    print((" " * log_nested.level) + message, file=sys.stderr)
   log_nested.level += 1
   yield
   log_nested.level -= 1

+
 log_nested.level = 0


 class Tensor(torch.Tensor):

   @staticmethod
-  def __new__(cls, elem, env):
-    dtype = j2t_dtype(elem.dtype)
+  def __new__(cls, elem, env, requires_grad=False):
+    dtype = mappings.j2t_dtype(elem.dtype)
     shape = list(elem.shape)
     for i, s in enumerate(shape):
       if not isinstance(s, int):
         shape[i] = 1
     if dtype is None:
       dtype = torch.float32
+    #dispatch_keys = torch.DispatchKeySet(torch._C.DispatchKey.PrivateUse1).add(torch._C.DispatchKey.AutogradPrivateUse1)
+    if not (dtype.is_floating_point or dtype.is_complex):
+      requires_grad = False
+
     return torch.Tensor._make_wrapper_subclass(
         cls,
         shape,
         dtype=dtype,
         device='meta',
-        requires_grad=
+        requires_grad=requires_grad,
     )

-  def __init__(self, elem: jax.Array, env:
+  def __init__(self, elem: jax.Array, env: "Environment", requires_grad=False):
     super().__init__()
     self._elem = elem
     self._env = env
@@ -88,12 +70,9 @@ class Tensor(torch.Tensor):

   __repr__ = __str__

-  def __jax_array__(self):
-    return self._elem
-
   @property
   def shape(self):
-    return self._elem.shape
+    return torch.Size(self._elem.shape)

   @property
   def ndim(self):
@@ -120,14 +99,15 @@ class Tensor(torch.Tensor):

   @classmethod
   def __torch_dispatch__(cls, func, types, args=(), kwargs=None):
-
-
-
-
-
-
-
-
+    # TODO(hanq): figure out why is dispatch mode not sufficient
+    if func == torch.ops._c10d_functional.wait_tensor.default:
+      return args[0]._env.dispatch(func, types, args, kwargs)
+    if func == torch.ops.prim.device.default:
+      return torch.device('privateuseone', 0)
+    raise AssertionError(
+        'torchax Tensors can only do math within the torchax environment.'
+        'Please wrap your code with `with torchax.default_env()` or '
+        'call torchax.enable_globally() before.')

   def detach(self):
     return Tensor(jax.lax.stop_gradient(self.jax()), self._env)
@@ -141,18 +121,18 @@ class Tensor(torch.Tensor):
     return self._elem

   def torch(self) -> torch.Tensor:
-    return
+    return self._env.j2t_copy(self.jax())

   @property
   def dtype(self):
-    return j2t_dtype(self._elem.dtype)
+    return mappings.j2t_dtype(self._elem.dtype)

   def dim(self):
     return self.ndim

   @property
   def device(self):
-    return torch.device(
+    return torch.device("jax:0")

   @property
   def jax_device(self):
@@ -160,7 +140,8 @@ class Tensor(torch.Tensor):

   @property
   def data(self):
-    logger.
+    logger.warning(
+        "In-place to .data modifications still results a copy on TPU")
     return self

   @data.setter
@@ -182,15 +163,15 @@ class Tensor(torch.Tensor):

   def shard_(self, sharding):
     self.apply_jax_(jax.lax.with_sharding_constraint, sharding)
-
+

 def debug_accuracy(func, args, kwargs, current_output):
   args_torch, kwargs_torch, out_torch = torch_pytree.tree_map_only(
-      torch.Tensor, lambda x:
+      torch.Tensor, lambda x: x.torch(), (args, kwargs, current_output))

   with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
-    if
-      kwargs_torch[
+    if "device" in kwargs_torch:
+      kwargs_torch["device"] = "cpu"  # do the torch native for comparison
     expected_out = func(*args_torch, **kwargs_torch)

   flattened_current_out, _ = torch_pytree.tree_flatten(out_torch)
@@ -200,8 +181,8 @@ def debug_accuracy(func, args, kwargs, current_output):
     if isinstance(ex, torch.Tensor) and ex.dtype != real.dtype:
       ex = ex.to(real.dtype)
     try:
-      if
-
+      if isinstance(ex, torch.Tensor) and not torch.allclose(
+          ex, real, atol=1e-3, equal_nan=True):
         import pdb

         pdb.set_trace()
@@ -212,46 +193,52 @@ def debug_accuracy(func, args, kwargs, current_output):

   return True

+
 def _make_debug_msg(is_dispatch, log_args, func, args, kwargs):
+
   def _display(a):
     if isinstance(a, torch.Tensor):
-      return f
+      return f"Tensor of {type(a)}: {a.dtype}{a.shape}"
     elif isinstance(a, jax.Array):
-      return f
+      return f"Jax Array of {type(a)}: {a.dtype}{a.shape}"
     else:
       return str(a)

   kwargs = kwargs or {}
-  title =
-  args_msg =
-  kwargs_msg =
-
+  title = "DISPATCH" if is_dispatch else "FUNCTION"
+  args_msg = "args: " + ",".join(_display(a) for a in args) if log_args else ""
+  kwargs_msg = ("kwargs: " +
+                ",".join(f"{key}: {_display(a)}" for key, a in kwargs.items())
+                if log_args else "")
+  return f"{title}: {_name_of_func(func)} {args_msg} ~ {kwargs_msg}"


 class XLAFunctionMode(torch.overrides.TorchFunctionMode):
   """Context manager that dispatches torch function calls to JAX."""

   def __init__(self, env):
-
+    self.env = env

   def __torch_function__(self,
                          func,
                          types,
                          args=(),
                          kwargs=None) -> torch.Tensor:
-    message = f
+    message = f"FUNCTION: {_name_of_func(func)}"
     if self.env.config.debug_print_each_op_operands:
-      message = message +
-    message = _make_debug_msg(False,
+      message = message + "f"
+    message = _make_debug_msg(False,
+                              self.env.config.debug_print_each_op_operands,
                               func, args, kwargs)
     with log_nested(self.env, message):
       try:
         return self.env.dispatch(func, types, args, kwargs)
       except OperatorNotFound:
         pass
-      if _name_of_func(func) in (
+      if _name_of_func(func) in (
+          "rot90"):  # skip rot90 with k%4==0 due to no change
        if len(args) >= 2 and type(args[1]) == int:
-          if (
+          if (args[1]) % 4 == 0:
             return args[0]
       return func(*args, **(kwargs or {}))

@@ -262,296 +249,463 @@ class XLADispatchMode(torch_dispatch.TorchDispatchMode):
     self.env = env

   def __torch_dispatch__(self, func, types, args=(), kwargs=None):
-    message = _make_debug_msg(True,
+    message = _make_debug_msg(True,
+                              self.env.config.debug_print_each_op_operands,
                               func, args, kwargs)
     with log_nested(self.env, message):
       if isinstance(func, torch._ops.OpOverloadPacket):
         with self:
           return func(*args, **kwargs)
-
+      # Only functions under these namespaces will be intercepted
+      if func.namespace not in (
+          "aten",
+          "_c10d_functional",
+          "torchvision",
+          "xla",
+      ):
         return func(*args, **kwargs)
       return self.env.dispatch(func, types, args, kwargs)

+
 def _name_of_func(func):
-  if hasattr(func,
+  if hasattr(func, "name"):
     return func.name()
   return func.__name__


 # Constructors that don't take other tensor as input
 TENSOR_CONSTRUCTORS = {
-
-
-
-
-
-
-
-
-
-
-
-
+    torch.ones,
+    torch.zeros,
+    torch.empty,
+    torch.empty_strided,
+    torch.tensor,
+    torch.arange,
+    torch.eye,
+    torch.randn,
+    torch.rand,
+    torch.randint,
+    torch.full,
+    torch.as_tensor,
 }

+# TODO(wen): use existing types, either from torch or jax
+SUPPORTED_JAX_PLATFROM = ["cpu", "tpu"]

-class Environment(contextlib.ContextDecorator):
-  """This class holds a set of configurations and "globals" needed

-
-
+class RuntimeProperty:
+  mesh: Any
+  prng: Any
+  autocast_dtype: Any

-
-
-
+  def __init__(self, mesh, prng, autocast_dtype):
+    self.mesh = mesh
+    self.prng = prng
+    self.autocast_dtype = autocast_dtype

-
-
+  def override(self, **kwargs):
+    return OverrideProperty(self, kwargs)
+
+  def get_and_rotate_prng_key(self):
+    old_key = self.prng
+    new_prng_key, next_key = jax.random.split(old_key)
+    self.prng = new_prng_key
+    return next_key
+
+
+class OverrideProperty(RuntimeProperty):

-
+  def __init__(self, parent, override):
+    self.parent = parent
+    self._override = dict(override)

+  def __getattr__(self, name):
+    if name in self._override:
+      return self._override[name]
+    return getattr(self.parent, name)

-  def __init__(self, configuration=None):
-    self._function_mode = XLAFunctionMode(self)
-    self._dispatch_mode = XLADispatchMode(self)

-
-
-
+class Environment(contextlib.ContextDecorator):
+  """This class holds a set of configurations and "globals" needed
+
+  for executing torch program using jax.
+  Things included so far:
+
+  op registry
+  PRNGKey
+  Configs

-
-
+  Also helper functions to manipulate those.
+  """

-
-
-
+  def __init__(self, configuration=None):
+    self._function_mode = XLAFunctionMode(self)
+    self._dispatch_mode = XLADispatchMode(self)

-
-
-
+    # name is torch callable
+    self._ops = {}
+    self._decomps = {}

-
-    device = str(device)
+    self.load_ops()

-
-
-      return jax.devices('cpu')[0]
+    _mesh = None
+    self.config = configuration or config.Configuration()

-
-      return jax.local_devices()[0]
+    self.enabled = False

-
-      return jax.local_devices()[0]
+    autocast_dtype = None

-
-
+    _prng_key = jax.random.key(torch.initial_seed() % (1 << 63))
+    self._property = threading.local()
+    self._property.content = [
+        RuntimeProperty(
+            mesh=_mesh, prng=_prng_key, autocast_dtype=autocast_dtype)
+    ]

+  @property
+  def param(self):
+    return self._property.content[-1]

-
-
-
-
+  def manual_seed(self, key):
+    jax_key = jax.random.PRNGKey(key)
+    new_prop = self.param.override(prng=jax_key)
+    self._property.content.append(new_prop)

-
-
-
-
-
-
+  @property
+  def prng_key(self):
+    return self.param.prng
+
+  def _should_use_torchax_tensor(self, device):
+    if device is None:
+      device = torch.get_default_device()
+
+    if isinstance(device, torch.device):
+      device = device.type
+
+    if ':' in device:
+      device = device.split(':')[0]
+
+    match device:
+      case 'cpu':
+        return False
+      case 'cuda':
+        return self.config.treat_cuda_as_jax_device
+      case 'jax':
+        return True
+      case 'privateuseone':
+        return True
+      case 'meta':
+        return self.enabled
+    return False
+
+  def load_ops(self):
+    from torchax.ops import jaten, jtorch, jc10d, jtorchvision_nms
+
+    for k, v in itertools.chain(ops_registry.all_aten_ops.items(),
+                                ops_registry.all_torch_functions.items()):
+      if v.is_jax_function:
+        self._ops[k] = v
+      else:
+        self._decomps[k] = v
+
+    from torchax.decompositions import DECOMPOSITIONS, MUTABLE_DECOMPOSITION
+
+    for k, v in DECOMPOSITIONS.items():
+      if k not in self._decomps:
+        self._decomps[k] = ops_registry.Operator(
             k,
             v,
             is_jax_function=False,
             is_user_defined=False,
-            needs_env=False
-
-
-
+            needs_env=False,
+            is_view_op=k in MUTABLE_DECOMPOSITION,
+        )
+
+  def _get_op_or_decomp(self, func):
+
+    def _get_from_dict(op_dict, op):
+      op = op_dict.get(func)
+      if op is None and isinstance(func, torch._ops.OpOverloadPacket):
+        op = op_dict.get(func.default)
+      if op is None and isinstance(func, torch._ops.OpOverload):
+        op = op_dict.get(func.overloadpacket)
+      return op
+
+    op = _get_from_dict(self._ops, func)
+
+    if op is None:
+      # fallback to decompose
+      op = _get_from_dict(self._decomps, func)
+
+    if op is None:
+      raise OperatorNotFound(
+          f"Operator with name {_name_of_func(func)} has no lowering")
+
+    return op
+
+  def _is_same_device(self, the_tensor, new_device):
+    if new_device is None:
+      return True
+    if new_device == 'meta' and the_tensor.device.type == 'jax':
+      return True
+    if the_tensor.device.type != new_device:
+      if the_tensor.device.type == 'cuda':
+        return self.config.treat_cuda_as_jax_device
+      return False
+    return True
+
+  def _to_copy(self, the_tensor, new_dtype, new_device):
+    if isinstance(the_tensor, View):
+      the_tensor = the_tensor.torch()
+    if isinstance(new_device, torch.device):
+      new_device = new_device.type
+    res = the_tensor
+    if not self._is_same_device(the_tensor, new_device):
       if isinstance(the_tensor, Tensor):
-
-
-
-      if new_device is not None:
-        # convert xla tensor to other device
-        # only supported is CPU
-        if str(new_device).startswith('cpu'):
-          # converting to a non-jax device: let torch native handle it
-          torch_tensor = j2t(arr) if isinstance(the_tensor, Tensor) else arr
-          with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
-            return torch_tensor.to(new_device)
+        torch_tensor = self.j2t_copy(the_tensor._elem)
+        with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
+          return torch_tensor.to(device=new_device, dtype=new_dtype)
       else:
-
-
-        the_tensor = the_tensor.to(new_dtype)
-      jax_device = self.get_as_jax_device(new_device)
-      if jax_device:
-        arr = t2j(the_tensor)
-        arr = jax.device_put(arr, jax_device)
-      else:
-        with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
-          return the_tensor.to(new_device)
-
-    return Tensor(arr, self)
-
+        arr = self.t2j_copy(the_tensor)
+        res = Tensor(arr, self, the_tensor.requires_grad)

-
-
+    if new_dtype is not None and new_dtype != the_tensor.dtype:
+      if isinstance(the_tensor, Tensor):
+        res = res.apply_jax(jnp.astype, mappings.t2j_dtype(new_dtype))
+      else:
+        with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
+          return the_tensor.to(device=new_device, dtype=new_dtype)
+    return res
+
+  def get_and_rotate_prng_key(self,
+                              generator: Optional[torch.Generator] = None):
+    if generator is not None:
+      return jax.random.PRNGKey(generator.initial_seed() % (2**63))
+    return self.param.get_and_rotate_prng_key()
+
+  def _handle_tensor_constructor(self, func, args, kwargs):
+    device = kwargs.get("device")
+    if self._should_use_torchax_tensor(device):
+      # don't set default device, let caller set it
+      requires_grad = kwargs.get("requires_grad", False)
+      op = self._get_op_or_decomp(func)
+      if op.needs_env:
+        kwargs['env'] = self
+      if op.is_jax_function:
+        (args, kwargs) = self.t2j_iso((args, kwargs))
+      res = op.func(*args, **kwargs)
+      if isinstance(res, jax.Array):
+        res = Tensor(res, self, requires_grad)
+      return res
+    else:
       with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
-
-            0, 2**32, (), dtype=torch.uint32, generator=generator).numpy()
-
-      return jax.random.key(next_key)
+        return func(*args, **kwargs)

-
-
-
-
-
-
-    with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
-      return func(*args, **kwargs)
-    with jax.default_device(jax_device):
-      op = self._ops.get(func)
-      if op is None and isinstance(func, torch._ops.OpOverload):
-        op = self._ops.get(func.overloadpacket)
-      res = op.func(*args, **kwargs)
-      if isinstance(res, jax.Array):
-        res = Tensor(res, self)
-      return res
-
-  def _torch_Tensor_to(self, args, kwargs):
-    the_tensor = args[0]
-    args = args[1:]
-    if len(args) >= 1 and isinstance(args[0], torch.Tensor):
-      dtype = args[0].dtype
-      device = args[0].device
-      return self._to_copy(the_tensor, dtype, device)
-    device = kwargs.get('device')
-    dtype = kwargs.get('dtype')
-    # args like pin_memory etc that we will ignore
-    args = list(filter(lambda x: not isinstance(x, bool), args))
-    if len(args) >= 2:
-      device, dtype, *_ = args
-    elif len(args) == 1 and isinstance(args[0], torch.dtype):
-      dtype = args[0]
-    elif len(args) == 1:
-      device = args[0]
+  def _torch_Tensor_to(self, args, kwargs):
+    the_tensor = args[0]
+    args = args[1:]
+    if len(args) >= 1 and isinstance(args[0], torch.Tensor):
+      dtype = args[0].dtype
+      device = args[0].device
       return self._to_copy(the_tensor, dtype, device)
+    device = kwargs.get("device")
+    dtype = kwargs.get("dtype")
+    # args like pin_memory etc that we will ignore
+    args = list(filter(lambda x: not isinstance(x, bool), args))
+    if len(args) >= 2:
+      device, dtype, *_ = args
+    elif len(args) == 1 and isinstance(args[0], torch.dtype):
+      dtype = args[0]
+    elif len(args) == 1:
+      device = args[0]
+    return self._to_copy(the_tensor, dtype, device)
+
+  def dispatch(self, func, types, args, kwargs):
+    kwargs = kwargs or {}
+    if func in TENSOR_CONSTRUCTORS:
+      return self._handle_tensor_constructor(func, args, kwargs)
+    if func in (
+        torch.Tensor.to,
+        torch.ops.aten.lift_fresh.default,
+        torch.ops.aten._to_copy,
+        torch.ops.aten._to_copy.default,
+    ):
+      return self._torch_Tensor_to(args, kwargs)
+
+    # If the func doesn't act on Tensor, and is not a tensor constructor,
+    # We should skip and let torch handle it.
+
+    tensor_args = [
+        t for t in torch_pytree.tree_flatten(args)[0]
+        if isinstance(t, torch.Tensor)
+    ]
+
+    def is_not_torchax_tensor(x):
+      return not isinstance(x, Tensor) and not isinstance(x, View)
+
+    if tensor_args and all(is_not_torchax_tensor(t) for t in tensor_args):
+      res = func(*args, **kwargs)
+      return res

+    with jax.named_scope(_name_of_func(func)):
+      op = self._get_op_or_decomp(func)

-
+      old_args, old_kwargs = args, kwargs
+      with self._dispatch_mode:
+        args, kwargs = torch_pytree.tree_map_only(
+            torch.distributed._functional_collectives.AsyncCollectiveTensor,
+            torch.distributed._functional_collectives.wait_tensor,
+            (args, kwargs),
+        )

-
-
-
-    if func in (torch.Tensor.to, torch.ops.aten.lift_fresh.default ,torch.ops.aten._to_copy, torch.ops.aten._to_copy.default):
-      return self._torch_Tensor_to(args, kwargs)
+      try:
+        if not op.is_view_op:
+          args, kwargs = self.v2t_iso((args, kwargs))

-
-
-
-
-
-
+        with self:
+          if self.param.autocast_dtype is not None:
+            autocast_policy = amp.autocast_policy.get(func)
+            if autocast_policy is not None:
+              args, kwargs = amp.execute_policy(autocast_policy, args, kwargs,
+                                                self.param.autocast_dtype)

-
-
+        if op.is_jax_function:
+          args, kwargs = self.t2j_iso((args, kwargs))
+      except AssertionError:
+        if self.config.debug_mixed_tensor:
+          breakpoint()
+        else:
+          raise

-
-
+      if op.needs_env:
+        kwargs["env"] = self

-
-
+      if op.is_jax_function:
+        res = op.func(*args, **kwargs)
+      else:
+        # enable dispatch mode because this op could be a composite autograd op
+        # meaning, it will decompose in C++
+        with self._dispatch_mode:
+          res = op.func(*args, **kwargs)

-
-
-          f'Operator with name {_name_of_func(func)} has no lowering')
+      if op.is_jax_function:
+        res = self.j2t_iso(res)

-
-
-          torch.distributed._functional_collectives.AsyncCollectiveTensor,
-          torch.distributed._functional_collectives.wait_tensor,
-          (args, kwargs))
-    try:
-      if op.is_jax_function:
-        args, kwargs = self.t2j_iso((args, kwargs))
-    except AssertionError:
-      if self.config.debug_mixed_tensor:
-        import pdb; pdb.set_trace()
-      else:
-        raise
+      if self.config.force_materialize_views and isinstance(res, View):
+        res = res.torch()

+      if self.config.debug_accuracy_for_each_op:
+        debug_accuracy(func, old_args, old_kwargs, res)
+      return res

-
-
+  def enable_torch_modes(self):
+    self._dispatch_mode.__enter__()
+    self._function_mode.__enter__()
+    self.enabled = True

-
-
+  def disable_torch_modes(self, *exc):
+    if not exc:
+      exc = (None, None, None)
+    self._function_mode.__exit__(*exc)
+    self._dispatch_mode.__exit__(*exc)
+    self.enabled = False

-
-
+  def __enter__(self):
+    self.enable_torch_modes()
+    return self

-
-
-    return res
+  def __exit__(self, *exc):
+    self.disable_torch_modes(*exc)

-
-
-    self
-
-
-  def disable_torch_modes(self, *exc):
-    if not exc:
-      exc = (None, None, None)
-    self._function_mode.__exit__(*exc)
-    self._dispatch_mode.__exit__(*exc)
-    self.enabled = False
-
-  def __enter__(self):
-    self.enable_torch_modes()
-    self._manually_entered = True
-    return self
-
-  def __exit__(self, *exc):
-    self._manually_entered = False
-    self.disable_torch_modes(*exc)
-
-  def _move_one_value(self, val):
-    if isinstance(val, torch.nn.Module):
-      with self:
-        return val.to('jax')
-    if isinstance(val, Tensor):
-      return val
-    if isinstance(val, torch.Tensor):
-      return Tensor(t2j(val), self)
+  def _move_one_value(self, val):
+    if isinstance(val, torch.nn.Module):
+      with self:
+        return val.to("jax")
+    if isinstance(val, Tensor):
       return val
+    if isinstance(val, torch.Tensor):
+      return Tensor(self.t2j_copy(val), self)
+    return val

-
-
-
-
-
-
+  def to_xla(self, torchvalues):
+    # tensors are torch.Tensors (not XLATensor)
+    res = torch_pytree.tree_map(self._move_one_value, torchvalues)
+    return res
+
+  def t2j_iso(self, torchtensors):
+    """Convert torchax Tensor to jax array.
+
+    This function will not copy, will just unwrap the inner jax array out.
+    Note: iso is short for "isomorphic"
+    """
+
+    def to_jax(x):
+      if self.config.allow_mixed_math_with_scalar_tensor and not isinstance(
+          x, Tensor):
+        if x.squeeze().ndim == 0:
+          return x.item()
+      if isinstance(
+          x, torch.distributed._functional_collectives.AsyncCollectiveTensor):
+        x = x.wait()
+      assert isinstance(x, Tensor) or isinstance(x, View), (
+          f"Expect a Tensor or a View but got {type(x)}; usually this means there is a mixed math between XLATensor and torch.Tensor"
+      )
+      return x.jax()
+
+    res = torch_pytree.tree_map_only(torch.Tensor, to_jax, torchtensors)
+    return res

-
-    def to_jax(x):
-      if isinstance(x, torch.distributed._functional_collectives.AsyncCollectiveTensor):
-        x = x.wait()
-      assert isinstance(x, Tensor), f'Expect a Tensor but got {type(x)}; usually this means there is a mixed math between XLATensor and torch.Tensor'
-      return x.jax()
-    return torch_pytree.tree_map_only(torch.Tensor, to_jax, torchtensors)
+  def v2t_iso(self, views):

-  def
-
-
+    def to_tensor(x):
+      if isinstance(x, View):
+        return x.torch()
+      return x

-
-
+    res = torch_pytree.tree_map_only(View, to_tensor, views)
+    return res

-
-
+  def j2t_iso(self, jaxarray):
+    """Convert jax array to torchax Tensor.
+
+    This function will not copy, will just wrap the jax array with a torchax Tensor
+    Note: iso is short for "isomorphic"
+    """
+    return torch_pytree.tree_map_only(jax.Array, lambda x: Tensor(x, self),
+                                      jaxarray)
+
+  def j2t_copy(self, args):
+    """Convert torch.Tensor in cpu to a jax array
+
+    This might involves copying the data (depending if dlpack is enabled)
+    """
+    return torch_pytree.tree_map_only(
+        jax.Array,
+        lambda x: mappings.j2t(x, self.config.use_dlpack_for_data_conversion),
+        args)
+
+  def t2j_copy(self, args):
+    """Convert jax array to torch.Tensor in cpu.
+
+    This might involves copying the data (depending if dlpack is enabled)
+    """
+    return torch_pytree.tree_map_only(
+        torch.Tensor,
+        lambda x: mappings.t2j(x, self.config.use_dlpack_for_data_conversion),
+        args)
+
+  def override_op_definition(self, op_to_override, op_impl):
+    self._ops[op_to_override] = ops_registry.Operator(
         op_to_override,
         op_impl,
         is_jax_function=False,
         is_user_defined=True,
-        needs_env=False
-
+        needs_env=False,
+    )
+
+  @contextlib.contextmanager
+  def override_property(self, **kwargs):
+    new_prop = self.param.override(**kwargs)
+    self._property.content.append(new_prop)
+    yield
+    self._property.content.pop()