torchax 0.0.4__py3-none-any.whl → 0.0.5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release. This version of torchax might be problematic.
- torchax/CONTRIBUTING.md +2 -2
- torchax/__init__.py +57 -19
- torchax/amp.py +333 -0
- torchax/config.py +19 -12
- torchax/decompositions.py +663 -195
- torchax/device_module.py +7 -1
- torchax/distributed.py +55 -60
- torchax/export.py +26 -17
- torchax/flax.py +39 -0
- torchax/interop.py +275 -141
- torchax/mesh_util.py +211 -0
- torchax/ops/jaten.py +1718 -1294
- torchax/ops/jax_reimplement.py +23 -21
- torchax/ops/jc10d.py +5 -4
- torchax/ops/jimage.py +113 -0
- torchax/ops/jlibrary.py +9 -2
- torchax/ops/jtorch.py +219 -78
- torchax/ops/jtorchvision_nms.py +32 -43
- torchax/ops/mappings.py +77 -35
- torchax/ops/op_base.py +59 -32
- torchax/ops/ops_registry.py +40 -35
- torchax/tensor.py +417 -275
- torchax/train.py +38 -41
- torchax/util.py +88 -0
- torchax/view.py +377 -0
- {torchax-0.0.4.dist-info → torchax-0.0.5.dist-info}/METADATA +111 -145
- torchax-0.0.5.dist-info/RECORD +32 -0
- torchax/environment.py +0 -2
- torchax-0.0.4.dist-info/RECORD +0 -27
- {torchax-0.0.4.dist-info → torchax-0.0.5.dist-info}/WHEEL +0 -0
- {torchax-0.0.4.dist-info → torchax-0.0.5.dist-info}/licenses/LICENSE +0 -0
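Most of the behavioral changes in this release land in torchax/tensor.py, shown below: Environment now keeps separate tables for JAX lowerings and decompositions, stores its PRNG key in a jax.experimental.mutable_array, gains target_device and autocast_dtype settings, and dispatch() learns about the new View type and the amp autocast policies. The sketch that follows shows roughly how those pieces are exercised from user code; it only uses names that appear in the diff (torchax.default_env(), device="jax", Tensor.torch(), autocast_dtype), and the exact call sites are assumptions rather than documented API.

    # Hypothetical usage sketch, not shipped with the package.
    import torch
    import torchax

    env = torchax.default_env()          # the Environment defined in torchax/tensor.py
    env.autocast_dtype = torch.bfloat16  # assumption: enables the amp policy path in dispatch()

    with env:                               # enters XLAFunctionMode / XLADispatchMode
      x = torch.randn(4, 4, device="jax")   # routed through _handle_tensor_constructor
      y = x @ x                             # lowered to JAX by Environment.dispatch
      y_cpu = y.torch()                     # j2t_copy back to a plain CPU torch.Tensor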
torchax/tensor.py
CHANGED
@@ -5,15 +5,18 @@ from typing import Optional, Any
 import jax
 import jax.numpy as jnp
 import numpy
+import itertools
 import torch
 import torch.distributed._functional_collectives
 import torch.func
 import torch.utils._mode_utils as mode_utils
 import torch.utils._python_dispatch as torch_dispatch
 import torch.utils._pytree as torch_pytree
-
+from torchax.view import View
 from torchax import config
 from torchax.ops import mappings, ops_registry
+from torchax import amp
+from jax.experimental import mutable_array

 logger = logging.getLogger(__name__)

@@ -30,32 +33,15 @@ def unwrap(torchtensors):
   return torch_pytree.tree_map_only(Tensor, lambda x: x._elem, torchtensors)


-def t2j(t):
-  if isinstance(t, Tensor):
-    return t._elem
-  return mappings.t2j(t)
-
-
-def j2t(x):
-  return mappings.j2t(x)
-
-
-def t2j_dtype(dtype):
-  return mappings.t2j_dtype(dtype)
-
-
-def j2t_dtype(dtype):
-  return mappings.j2t_dtype(dtype)
-
-
 @contextlib.contextmanager
 def log_nested(env, message):
   if env.config.debug_print_each_op:
-    print((
+    print((" " * log_nested.level) + message, file=sys.stderr)
   log_nested.level += 1
   yield
   log_nested.level -= 1

+
 log_nested.level = 0


@@ -63,7 +49,7 @@ class Tensor(torch.Tensor):

   @staticmethod
   def __new__(cls, elem, env):
-    dtype = j2t_dtype(elem.dtype)
+    dtype = mappings.j2t_dtype(elem.dtype)
     shape = list(elem.shape)
     for i, s in enumerate(shape):
       if not isinstance(s, int):
@@ -74,11 +60,11 @@ class Tensor(torch.Tensor):
         cls,
         shape,
         dtype=dtype,
-        device=
+        device="meta",
         requires_grad=False,
     )

-  def __init__(self, elem: jax.Array, env:
+  def __init__(self, elem: jax.Array, env: "Environment"):
     super().__init__()
     self._elem = elem
     self._env = env
@@ -93,7 +79,7 @@ class Tensor(torch.Tensor):

   @property
   def shape(self):
-    return self._elem.shape
+    return torch.Size(self._elem.shape)

   @property
   def ndim(self):
@@ -120,14 +106,13 @@ class Tensor(torch.Tensor):

   @classmethod
   def __torch_dispatch__(cls, func, types, args=(), kwargs=None):
-
-
-
-
-
-
-
-    return func(*args, **(kwargs or {}))
+    # TODO(hanq): figure out why is dispatch mode not sufficient
+    if func == torch.ops._c10d_functional.wait_tensor.default:
+      return args[0]._env.dispatch(func, types, args, kwargs)
+    raise AssertionError(
+        'torchax Tensors can only do math within the torchax environment.'
+        'Please wrap your code with `with torchax.default_env()` or '
+        'call torchax.enable_globally() before.')

   def detach(self):
     return Tensor(jax.lax.stop_gradient(self.jax()), self._env)
@@ -141,18 +126,18 @@ class Tensor(torch.Tensor):
     return self._elem

   def torch(self) -> torch.Tensor:
-    return
+    return self._env.j2t_copy(self.jax())

   @property
   def dtype(self):
-    return j2t_dtype(self._elem.dtype)
+    return mappings.j2t_dtype(self._elem.dtype)

   def dim(self):
     return self.ndim

   @property
   def device(self):
-    return torch.device(
+    return torch.device("jax:0")

   @property
   def jax_device(self):
@@ -160,7 +145,8 @@ class Tensor(torch.Tensor):

   @property
   def data(self):
-    logger.
+    logger.warning(
+        "In-place to .data modifications still results a copy on TPU")
     return self

   @data.setter
@@ -182,15 +168,15 @@ class Tensor(torch.Tensor):

   def shard_(self, sharding):
     self.apply_jax_(jax.lax.with_sharding_constraint, sharding)
-
+

 def debug_accuracy(func, args, kwargs, current_output):
   args_torch, kwargs_torch, out_torch = torch_pytree.tree_map_only(
-      torch.Tensor, lambda x:
+      torch.Tensor, lambda x: x.torch(), (args, kwargs, current_output))

   with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
-    if
-      kwargs_torch[
+    if "device" in kwargs_torch:
+      kwargs_torch["device"] = "cpu"  # do the torch native for comparison
     expected_out = func(*args_torch, **kwargs_torch)

   flattened_current_out, _ = torch_pytree.tree_flatten(out_torch)
@@ -200,8 +186,8 @@ def debug_accuracy(func, args, kwargs, current_output):
     if isinstance(ex, torch.Tensor) and ex.dtype != real.dtype:
       ex = ex.to(real.dtype)
     try:
-      if
-
+      if isinstance(ex, torch.Tensor) and not torch.allclose(
+          ex, real, atol=1e-3, equal_nan=True):
         import pdb

         pdb.set_trace()
@@ -212,46 +198,52 @@ def debug_accuracy(func, args, kwargs, current_output):

   return True

+
 def _make_debug_msg(is_dispatch, log_args, func, args, kwargs):
+
   def _display(a):
     if isinstance(a, torch.Tensor):
-      return f
+      return f"Tensor of {type(a)}: {a.dtype}{a.shape}"
     elif isinstance(a, jax.Array):
-      return f
+      return f"Jax Array of {type(a)}: {a.dtype}{a.shape}"
     else:
       return str(a)

   kwargs = kwargs or {}
-  title =
-  args_msg =
-  kwargs_msg =
-
+  title = "DISPATCH" if is_dispatch else "FUNCTION"
+  args_msg = "args: " + ",".join(_display(a) for a in args) if log_args else ""
+  kwargs_msg = ("kwargs: " +
+                ",".join(f"{key}: {_display(a)}" for key, a in kwargs.items())
+                if log_args else "")
+  return f"{title}: {_name_of_func(func)} {args_msg} ~ {kwargs_msg}"


 class XLAFunctionMode(torch.overrides.TorchFunctionMode):
   """Context manager that dispatches torch function calls to JAX."""

   def __init__(self, env):
-
+    self.env = env

   def __torch_function__(self,
                          func,
                          types,
                          args=(),
                          kwargs=None) -> torch.Tensor:
-    message = f
+    message = f"FUNCTION: {_name_of_func(func)}"
     if self.env.config.debug_print_each_op_operands:
-      message = message +
-    message = _make_debug_msg(False,
+      message = message + "f"
+    message = _make_debug_msg(False,
+                              self.env.config.debug_print_each_op_operands,
                               func, args, kwargs)
     with log_nested(self.env, message):
       try:
         return self.env.dispatch(func, types, args, kwargs)
       except OperatorNotFound:
         pass
-      if _name_of_func(func) in (
+      if _name_of_func(func) in (
+          "rot90"):  # skip rot90 with k%4==0 due to no change
         if len(args) >= 2 and type(args[1]) == int:
-          if (
+          if (args[1]) % 4 == 0:
             return args[0]
     return func(*args, **(kwargs or {}))

@@ -262,296 +254,446 @@ class XLADispatchMode(torch_dispatch.TorchDispatchMode):
     self.env = env

   def __torch_dispatch__(self, func, types, args=(), kwargs=None):
-    message = _make_debug_msg(True,
+    message = _make_debug_msg(True,
+                              self.env.config.debug_print_each_op_operands,
                               func, args, kwargs)
     with log_nested(self.env, message):
       if isinstance(func, torch._ops.OpOverloadPacket):
         with self:
           return func(*args, **kwargs)
-
+      # Only functions under these namespaces will be intercepted
+      if func.namespace not in (
+          "aten",
+          "_c10d_functional",
+          "torchvision",
+          "xla",
+      ):
         return func(*args, **kwargs)
       return self.env.dispatch(func, types, args, kwargs)

+
 def _name_of_func(func):
-  if hasattr(func,
+  if hasattr(func, "name"):
     return func.name()
   return func.__name__


 # Constructors that don't take other tensor as input
 TENSOR_CONSTRUCTORS = {
-
-
-
-
-
-
-
-
-
-
-
-
+    torch.ones,
+    torch.zeros,
+    torch.empty,
+    torch.empty_strided,
+    torch.tensor,
+    torch.arange,
+    torch.eye,
+    torch.randn,
+    torch.rand,
+    torch.randint,
+    torch.full,
+    torch.as_tensor,
 }

+# TODO(wen): use existing types, either from torch or jax
+SUPPORTED_JAX_PLATFROM = ["cpu", "tpu"]

-class Environment(contextlib.ContextDecorator):
-  """This class holds a set of configurations and "globals" needed
-
-  for executing torch program using jax.
-  Things included so far:
-
-    op registry
-    PRNGKey
-    Configs

-
-
+class Environment(contextlib.ContextDecorator):
+  """This class holds a set of configurations and "globals" needed

-
+  for executing torch program using jax.
+  Things included so far:

+    op registry
+    PRNGKey
+    Configs

-
-
-    self._dispatch_mode = XLADispatchMode(self)
+  Also helper functions to manipulate those.
+  """

-
-
-
+  def __init__(self, configuration=None):
+    self._function_mode = XLAFunctionMode(self)
+    self._dispatch_mode = XLADispatchMode(self)

-
-
+    # name is torch callable
+    self._ops = {}
+    self._decomps = {}

-
-    self.enabled = False
-    self._jax_devices = set(['jax', 'jax_cpu', 'xla'])
+    self.load_ops()

-
-
-      device = torch.get_default_device()
+    self._mesh = None
+    self.config = configuration or config.Configuration()

-
-
+    self._manually_entered = False
+    self.enabled = False

-
-
-
+    self._prng_key = mutable_array(
+        jax.random.key(torch.initial_seed() % (1 << 63)))
+    self.autocast_dtype = None
+    self._target_device = jax.local_devices()[0].platform

-
-
+  @property
+  def target_device(self):
+    return self._target_device

-
-
+  @target_device.setter
+  def target_device(self, device: str):
+    self._target_device = device.lower()

-
-
+  def manual_seed(self, key):
+    self._prng_key = mutable_array(jax.random.key(key))

+  @property
+  def prng_key(self):
+    return self._prng_key[...]
+
+  def get_as_jax_device(self, device: Any):
+    if device is None:
+      device = torch.get_default_device()
+
+    if isinstance(device, torch.device):
+      device = str(device)
+
+    if not self.config.use_torch_native_for_cpu_tensor and device.startswith(
+        "cpu"):
+      return jax.devices("cpu")[0]
+
+    if self.config.treat_cuda_as_jax_device and device.startswith("cuda"):
+      return jax.local_devices()[0]
+
+    if device.startswith("xla"):
+      return jax.local_devices()[0]
+
+    # TODO (wen): jax is NOT a device type,
+    # once we can register more than one backend, revisit
+    if device.startswith("jax"):
+      match self.target_device:
+        case "cpu":
+          return jax.devices("cpu")[0]
+        case "tpu":
+          return jax.devices("tpu")[0]
+        case _:
+          raise AttributeError(
+              f"Cannot handle env.target_device {self.target_device}")
+
+    return None  # fallback to torch
+
+  def load_ops(self):
+    from torchax.ops import jaten, jtorch, jc10d, jtorchvision_nms
+
+    for k, v in itertools.chain(ops_registry.all_aten_ops.items(),
+                                ops_registry.all_torch_functions.items()):
+      if v.is_jax_function:
+        self._ops[k] = v
+      else:
+        self._decomps[k] = v

-
-    from torchax.ops import jaten, jtorch, jc10d, jtorchvision_nms
-    self._ops.update(ops_registry.all_aten_ops)
-    self._ops.update(ops_registry.all_torch_functions)
+    from torchax.decompositions import DECOMPOSITIONS, MUTABLE_DECOMPOSITION

-
-
-
-    for k, v in decomps.items():
-      if k not in self._ops:
-        self._ops[k] = ops_registry.Operator(
+    for k, v in DECOMPOSITIONS.items():
+      if k not in self._decomps:
+        self._decomps[k] = ops_registry.Operator(
             k,
             v,
             is_jax_function=False,
             is_user_defined=False,
-            needs_env=False
-
-
-
-
-
-
-
-
-
-
-
+            needs_env=False,
+            is_view_op=k in MUTABLE_DECOMPOSITION,
+        )
+
+  def _get_op_or_decomp(self, func):
+
+    def _get_from_dict(op_dict, op):
+      op = op_dict.get(func)
+      if op is None and isinstance(func, torch._ops.OpOverloadPacket):
+        op = op_dict.get(func.default)
+      if op is None and isinstance(func, torch._ops.OpOverload):
+        op = op_dict.get(func.overloadpacket)
+      return op
+
+    op = _get_from_dict(self._ops, func)
+
+    if op is None:
+      # fallback to decompose
+      op = _get_from_dict(self._decomps, func)
+
+    if op is None:
+      raise OperatorNotFound(
+          f"Operator with name {_name_of_func(func)} has no lowering")
+
+    return op
+
+  def _to_copy(self, the_tensor, new_dtype, new_device):
+    if isinstance(the_tensor, View):
+      the_tensor = the_tensor.torch()
+
+    if isinstance(the_tensor, Tensor):
+
+      arr = the_tensor.jax()
+
+      if new_dtype is not None and new_dtype != arr.dtype:
+        arr = arr.astype(mappings.t2j_dtype(new_dtype))
+
+      if new_device is not None:
+        match str(new_device).lower():
+          case "cpu":
             # converting to a non-jax device: let torch native handle it
-            torch_tensor =
+            torch_tensor = self.j2t_copy(arr) if isinstance(the_tensor,
+                                                            Tensor) else arr
             with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
               return torch_tensor.to(new_device)
+          case "jax":
+            # move torchax.tensor / jax tensor between devices
+            # I don't know ifgit this will work after the model is jitted
+            if self.target_device != the_tensor.jax_device.platform:
+              arr = jax.device_put(the_tensor.jax(),
+                                   jax.devices(self.target_device)[0])
+            return Tensor(arr, self)
+          case _:
+            logging.error(f"torchax.Tenosr cannot handle device {new_device}")
+
+    else:
+      if new_dtype is not None and new_dtype != the_tensor.dtype:
+        with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
+          the_tensor = the_tensor.to(new_dtype)
+
+      if new_device is None:  ## device is None means don't change device
+        return the_tensor
+
+      jax_device = self.get_as_jax_device(new_device)
+      if jax_device:
+        arr = self.t2j_copy(the_tensor)
+        arr = jax.device_put(arr, jax_device)
       else:
-
-
-      the_tensor = the_tensor.to(new_dtype)
-    jax_device = self.get_as_jax_device(new_device)
-    if jax_device:
-      arr = t2j(the_tensor)
-      arr = jax.device_put(arr, jax_device)
-    else:
-      with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
-        return the_tensor.to(new_device)
+        with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
+          return the_tensor.to(new_device)

-
-
+    return Tensor(arr, self)

-
-
+  def get_and_rotate_prng_key(self,
+                              generator: Optional[torch.Generator] = None):
+    if generator is not None:
       with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
-
-
-
-
+        self._prng_key[...] = jax.random.key(generator.initial_seed() % (2**63))
+    old_key = self._prng_key[...]
+    new_prng_key, next_key = jax.random.split(old_key)
+    self._prng_key[...] = new_prng_key
+    return next_key
+
+  def _handle_tensor_constructor(self, func, args, kwargs):
+    device = kwargs.get("device")
+    jax_device = self.get_as_jax_device(device)
+    # TODO(qihqi) figure out better ways for device propagation
+    if not self._manually_entered and jax_device is None:
+      # let torch handle it
+      with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
+        return func(*args, **kwargs)
+    with jax.default_device(jax_device):
+      requires_grad = kwargs.get("requires_grad", False)
+      op = self._get_op_or_decomp(func)
+      res = op.func(*args, **kwargs)
+      if isinstance(res, jax.Array):
+        res = Tensor(res, self)
+      if requires_grad:
+        res.requires_grad = True
+      return res

-
-
-
-
-
-
-      with mode_utils.no_dispatch(), torch._C.DisableTorchFunction():
-        return func(*args, **kwargs)
-    with jax.default_device(jax_device):
-      op = self._ops.get(func)
-      if op is None and isinstance(func, torch._ops.OpOverload):
-        op = self._ops.get(func.overloadpacket)
-      res = op.func(*args, **kwargs)
-      if isinstance(res, jax.Array):
-        res = Tensor(res, self)
-      return res
-
-  def _torch_Tensor_to(self, args, kwargs):
-    the_tensor = args[0]
-    args = args[1:]
-    if len(args) >= 1 and isinstance(args[0], torch.Tensor):
-      dtype = args[0].dtype
-      device = args[0].device
-      return self._to_copy(the_tensor, dtype, device)
-    device = kwargs.get('device')
-    dtype = kwargs.get('dtype')
-    # args like pin_memory etc that we will ignore
-    args = list(filter(lambda x: not isinstance(x, bool), args))
-    if len(args) >= 2:
-      device, dtype, *_ = args
-    elif len(args) == 1 and isinstance(args[0], torch.dtype):
-      dtype = args[0]
-    elif len(args) == 1:
-      device = args[0]
+  def _torch_Tensor_to(self, args, kwargs):
+    the_tensor = args[0]
+    args = args[1:]
+    if len(args) >= 1 and isinstance(args[0], torch.Tensor):
+      dtype = args[0].dtype
+      device = args[0].device
       return self._to_copy(the_tensor, dtype, device)
+    device = kwargs.get("device")
+    dtype = kwargs.get("dtype")
+    # args like pin_memory etc that we will ignore
+    args = list(filter(lambda x: not isinstance(x, bool), args))
+    if len(args) >= 2:
+      device, dtype, *_ = args
+    elif len(args) == 1 and isinstance(args[0], torch.dtype):
+      dtype = args[0]
+    elif len(args) == 1:
+      device = args[0]
+    return self._to_copy(the_tensor, dtype, device)
+
+  def dispatch(self, func, types, args, kwargs):
+    kwargs = kwargs or {}
+    if func in TENSOR_CONSTRUCTORS:
+      return self._handle_tensor_constructor(func, args, kwargs)
+    if func in (
+        torch.Tensor.to,
+        torch.ops.aten.lift_fresh.default,
+        torch.ops.aten._to_copy,
+        torch.ops.aten._to_copy.default,
+    ):
+      return self._torch_Tensor_to(args, kwargs)
+
+    # If the func doesn't act on Tensor, and is not a tensor constructor,
+    # We should skip and let torch handle it.
+
+    tensor_args = [
+        t for t in torch_pytree.tree_flatten(args)[0]
+        if isinstance(t, torch.Tensor)
+    ]
+
+    def is_not_torchax_tensor(x):
+      return not isinstance(x, Tensor) and not isinstance(x, View)
+
+    if tensor_args and all(is_not_torchax_tensor(t) for t in tensor_args):
+      res = func(*args, **kwargs)
+      return res

+    with jax.named_scope(_name_of_func(func)):
+      op = self._get_op_or_decomp(func)

-
+      old_args, old_kwargs = args, kwargs
+      with self._dispatch_mode:
+        args, kwargs = torch_pytree.tree_map_only(
+            torch.distributed._functional_collectives.AsyncCollectiveTensor,
+            torch.distributed._functional_collectives.wait_tensor,
+            (args, kwargs),
+        )

-
-
-
-    if func in (torch.Tensor.to, torch.ops.aten.lift_fresh.default ,torch.ops.aten._to_copy, torch.ops.aten._to_copy.default):
-      return self._torch_Tensor_to(args, kwargs)
+      try:
+        if not op.is_view_op:
+          args, kwargs = self.v2t_iso((args, kwargs))

-
-
-
-
-
-
+        with self:
+          if self.autocast_dtype is not None:
+            autocast_policy = amp.autocast_policy.get(func)
+            if autocast_policy is not None:
+              args, kwargs = amp.execute_policy(autocast_policy, args, kwargs,
+                                                self.autocast_dtype)

-
-
+          if op.is_jax_function:
+            args, kwargs = self.t2j_iso((args, kwargs))
+      except AssertionError:
+        if self.config.debug_mixed_tensor:
+          breakpoint()
+        else:
+          raise

-
-
+      if op.needs_env:
+        kwargs["env"] = self

-
-
+      if op.is_jax_function:
+        res = op.func(*args, **kwargs)
+      else:
+        # enable dispatch mode because this op could be a composite autograd op
+        # meaning, it will decompose in C++
+        with self._dispatch_mode:
+          res = op.func(*args, **kwargs)

-
-
-          f'Operator with name {_name_of_func(func)} has no lowering')
+      if op.is_jax_function:
+        res = self.j2t_iso(res)

-
-
-          torch.distributed._functional_collectives.AsyncCollectiveTensor,
-          torch.distributed._functional_collectives.wait_tensor,
-          (args, kwargs))
-      try:
-        if op.is_jax_function:
-          args, kwargs = self.t2j_iso((args, kwargs))
-      except AssertionError:
-        if self.config.debug_mixed_tensor:
-          import pdb; pdb.set_trace()
-        else:
-          raise
+      if self.config.force_materialize_views and isinstance(res, View):
+        res = res.torch()

+      if self.config.debug_accuracy_for_each_op:
+        debug_accuracy(func, old_args, old_kwargs, res)
+      return res

-
-
+  def enable_torch_modes(self):
+    self._dispatch_mode.__enter__()
+    self._function_mode.__enter__()
+    self.enabled = True
+
+  def disable_torch_modes(self, *exc):
+    if not exc:
+      exc = (None, None, None)
+    self._function_mode.__exit__(*exc)
+    self._dispatch_mode.__exit__(*exc)
+    self.enabled = False
+
+  def __enter__(self):
+    self.enable_torch_modes()
+    self._manually_entered = True
+    return self

-
-
+  def __exit__(self, *exc):
+    self._manually_entered = False
+    self.disable_torch_modes(*exc)

-
-
+  def _move_one_value(self, val):
+    if isinstance(val, torch.nn.Module):
+      with self:
+        return val.to("jax")
+    if isinstance(val, Tensor):
+      return val
+    if isinstance(val, torch.Tensor):
+      return Tensor(self.t2j_copy(val), self)
+    return val

-
-
-
+  def to_xla(self, torchvalues):
+    # tensors are torch.Tensors (not XLATensor)
+    res = torch_pytree.tree_map(self._move_one_value, torchvalues)
+    return res

-
-
-    self._function_mode.__enter__()
-    self.enabled = True
+  def t2j_iso(self, torchtensors):
+    """Convert torchax Tensor to jax array.

-
-
-
-    self._function_mode.__exit__(*exc)
-    self._dispatch_mode.__exit__(*exc)
-    self.enabled = False
-
-  def __enter__(self):
-    self.enable_torch_modes()
-    self._manually_entered = True
-    return self
-
-  def __exit__(self, *exc):
-    self._manually_entered = False
-    self.disable_torch_modes(*exc)
-
-  def _move_one_value(self, val):
-    if isinstance(val, torch.nn.Module):
-      with self:
-        return val.to('jax')
-    if isinstance(val, Tensor):
-      return val
-    if isinstance(val, torch.Tensor):
-      return Tensor(t2j(val), self)
-    return val
+    This function will not copy, will just unwrap the inner jax array out.
+    Note: iso is short for "isomorphic"
+    """

-  def
-
-
-
-
-
+    def to_jax(x):
+      if isinstance(
+          x, torch.distributed._functional_collectives.AsyncCollectiveTensor):
+        x = x.wait()
+      assert isinstance(x, Tensor) or isinstance(x, View), (
+          f"Expect a Tensor or a View but got {type(x)}; usually this means there is a mixed math between XLATensor and torch.Tensor"
+      )
+      return x.jax()
+
+    res = torch_pytree.tree_map_only(torch.Tensor, to_jax, torchtensors)
+    return res

-
-    def to_jax(x):
-      if isinstance(x, torch.distributed._functional_collectives.AsyncCollectiveTensor):
-        x = x.wait()
-      assert isinstance(x, Tensor), f'Expect a Tensor but got {type(x)}; usually this means there is a mixed math between XLATensor and torch.Tensor'
-      return x.jax()
-    return torch_pytree.tree_map_only(torch.Tensor, to_jax, torchtensors)
+  def v2t_iso(self, views):

-  def
-
-
+    def to_tensor(x):
+      if isinstance(x, View):
+        return x.torch()
+      return x

-
-
+    res = torch_pytree.tree_map_only(View, to_tensor, views)
+    return res

-
-
+  def j2t_iso(self, jaxarray):
+    """Convert jax array to torchax Tensor.
+
+    This function will not copy, will just wrap the jax array with a torchax Tensor
+    Note: iso is short for "isomorphic"
+    """
+    return torch_pytree.tree_map_only(jax.Array, lambda x: Tensor(x, self),
+                                      jaxarray)
+
+  def j2t_copy(self, args):
+    """Convert torch.Tensor in cpu to a jax array
+
+    This might involves copying the data (depending if dlpack is enabled)
+    """
+    return torch_pytree.tree_map_only(
+        jax.Array,
+        lambda x: mappings.j2t(x, self.config.use_dlpack_for_data_conversion),
+        args)
+
+  def t2j_copy(self, args):
+    """Convert jax array to torch.Tensor in cpu.
+
+    This might involves copying the data (depending if dlpack is enabled)
+    """
+    return torch_pytree.tree_map_only(
+        torch.Tensor,
+        lambda x: mappings.t2j(x, self.config.use_dlpack_for_data_conversion),
+        args)
+
+  def override_op_definition(self, op_to_override, op_impl):
+    self._ops[op_to_override] = ops_registry.Operator(
         op_to_override,
         op_impl,
         is_jax_function=False,
         is_user_defined=True,
-        needs_env=False
-
+        needs_env=False,
+    )
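For readers unfamiliar with jax.experimental.mutable_array, the PRNG bookkeeping added above (Environment._prng_key together with get_and_rotate_prng_key) boils down to the following standalone pattern: keep the key in a mutable array so it can be advanced in place, and hand each consumer a fresh subkey. The names below are illustrative only, not torchax API.

    # Standalone sketch of the split-and-store PRNG pattern; illustrative names.
    import jax
    from jax.experimental import mutable_array

    state = mutable_array(jax.random.key(0))

    def next_key():
      old = state[...]                       # read the current key
      new_state, subkey = jax.random.split(old)
      state[...] = new_state                 # rotate the stored key in place
      return subkey                          # one-use subkey for the caller

    samples = [jax.random.normal(next_key(), (2,)) for _ in range(3)]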