ai-edge-torch-nightly 0.3.0.dev20250114__py3-none-any.whl

Files changed (213)
  1. ai_edge_torch/__init__.py +32 -0
  2. ai_edge_torch/_config.py +69 -0
  3. ai_edge_torch/_convert/__init__.py +14 -0
  4. ai_edge_torch/_convert/conversion.py +153 -0
  5. ai_edge_torch/_convert/conversion_utils.py +64 -0
  6. ai_edge_torch/_convert/converter.py +270 -0
  7. ai_edge_torch/_convert/fx_passes/__init__.py +23 -0
  8. ai_edge_torch/_convert/fx_passes/build_aten_composite_pass.py +288 -0
  9. ai_edge_torch/_convert/fx_passes/build_interpolate_composite_pass.py +131 -0
  10. ai_edge_torch/_convert/fx_passes/inject_mlir_debuginfo_pass.py +73 -0
  11. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/__init__.py +16 -0
  12. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/layout_check.py +258 -0
  13. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/layout_mark.py +50 -0
  14. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/layout_partitioners/__init__.py +18 -0
  15. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/layout_partitioners/greedy.py +68 -0
  16. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/layout_partitioners/min_cut.py +216 -0
  17. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/layout_rewrite.py +449 -0
  18. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/op_func_registry.py +30 -0
  19. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/pass_body.py +303 -0
  20. ai_edge_torch/_convert/fx_passes/optimize_layout_transposes_pass/utils.py +64 -0
  21. ai_edge_torch/_convert/fx_passes/remove_non_user_outputs_pass.py +52 -0
  22. ai_edge_torch/_convert/signature.py +66 -0
  23. ai_edge_torch/_convert/test/__init__.py +14 -0
  24. ai_edge_torch/_convert/test/test_convert.py +558 -0
  25. ai_edge_torch/_convert/test/test_convert_composites.py +234 -0
  26. ai_edge_torch/_convert/test/test_convert_multisig.py +189 -0
  27. ai_edge_torch/_convert/test/test_to_channel_last_io.py +96 -0
  28. ai_edge_torch/_convert/to_channel_last_io.py +92 -0
  29. ai_edge_torch/conftest.py +20 -0
  30. ai_edge_torch/debug/__init__.py +17 -0
  31. ai_edge_torch/debug/culprit.py +496 -0
  32. ai_edge_torch/debug/test/__init__.py +14 -0
  33. ai_edge_torch/debug/test/test_culprit.py +140 -0
  34. ai_edge_torch/debug/test/test_search_model.py +51 -0
  35. ai_edge_torch/debug/utils.py +59 -0
  36. ai_edge_torch/experimental/__init__.py +14 -0
  37. ai_edge_torch/fx_pass_base.py +110 -0
  38. ai_edge_torch/generative/__init__.py +14 -0
  39. ai_edge_torch/generative/examples/__init__.py +14 -0
  40. ai_edge_torch/generative/examples/amd_llama_135m/__init__.py +14 -0
  41. ai_edge_torch/generative/examples/amd_llama_135m/amd_llama_135m.py +87 -0
  42. ai_edge_torch/generative/examples/amd_llama_135m/convert_to_tflite.py +70 -0
  43. ai_edge_torch/generative/examples/amd_llama_135m/verify.py +72 -0
  44. ai_edge_torch/generative/examples/gemma/__init__.py +14 -0
  45. ai_edge_torch/generative/examples/gemma/convert_gemma1_to_tflite.py +80 -0
  46. ai_edge_torch/generative/examples/gemma/convert_gemma2_to_tflite.py +80 -0
  47. ai_edge_torch/generative/examples/gemma/gemma1.py +107 -0
  48. ai_edge_torch/generative/examples/gemma/gemma2.py +295 -0
  49. ai_edge_torch/generative/examples/gemma/verify_gemma1.py +56 -0
  50. ai_edge_torch/generative/examples/gemma/verify_gemma2.py +43 -0
  51. ai_edge_torch/generative/examples/gemma/verify_util.py +157 -0
  52. ai_edge_torch/generative/examples/llama/__init__.py +14 -0
  53. ai_edge_torch/generative/examples/llama/convert_to_tflite.py +91 -0
  54. ai_edge_torch/generative/examples/llama/llama.py +196 -0
  55. ai_edge_torch/generative/examples/llama/verify.py +88 -0
  56. ai_edge_torch/generative/examples/moonshine/__init__.py +14 -0
  57. ai_edge_torch/generative/examples/moonshine/convert_moonshine_to_tflite.py +50 -0
  58. ai_edge_torch/generative/examples/moonshine/moonshine.py +103 -0
  59. ai_edge_torch/generative/examples/openelm/__init__.py +14 -0
  60. ai_edge_torch/generative/examples/openelm/convert_to_tflite.py +80 -0
  61. ai_edge_torch/generative/examples/openelm/openelm.py +127 -0
  62. ai_edge_torch/generative/examples/openelm/verify.py +71 -0
  63. ai_edge_torch/generative/examples/paligemma/__init__.py +14 -0
  64. ai_edge_torch/generative/examples/paligemma/convert_to_tflite.py +95 -0
  65. ai_edge_torch/generative/examples/paligemma/decoder.py +151 -0
  66. ai_edge_torch/generative/examples/paligemma/decoder2.py +177 -0
  67. ai_edge_torch/generative/examples/paligemma/image_encoder.py +160 -0
  68. ai_edge_torch/generative/examples/paligemma/paligemma.py +179 -0
  69. ai_edge_torch/generative/examples/paligemma/verify.py +161 -0
  70. ai_edge_torch/generative/examples/paligemma/verify_decoder.py +75 -0
  71. ai_edge_torch/generative/examples/paligemma/verify_decoder2.py +72 -0
  72. ai_edge_torch/generative/examples/paligemma/verify_image_encoder.py +99 -0
  73. ai_edge_torch/generative/examples/phi/__init__.py +14 -0
  74. ai_edge_torch/generative/examples/phi/convert_phi3_to_tflite.py +80 -0
  75. ai_edge_torch/generative/examples/phi/convert_to_tflite.py +80 -0
  76. ai_edge_torch/generative/examples/phi/phi2.py +107 -0
  77. ai_edge_torch/generative/examples/phi/phi3.py +219 -0
  78. ai_edge_torch/generative/examples/phi/verify.py +64 -0
  79. ai_edge_torch/generative/examples/phi/verify_phi3.py +69 -0
  80. ai_edge_torch/generative/examples/qwen/__init__.py +14 -0
  81. ai_edge_torch/generative/examples/qwen/convert_to_tflite.py +93 -0
  82. ai_edge_torch/generative/examples/qwen/qwen.py +134 -0
  83. ai_edge_torch/generative/examples/qwen/verify.py +88 -0
  84. ai_edge_torch/generative/examples/smollm/__init__.py +14 -0
  85. ai_edge_torch/generative/examples/smollm/convert_to_tflite.py +80 -0
  86. ai_edge_torch/generative/examples/smollm/convert_v2_to_tflite.py +71 -0
  87. ai_edge_torch/generative/examples/smollm/smollm.py +125 -0
  88. ai_edge_torch/generative/examples/smollm/verify.py +86 -0
  89. ai_edge_torch/generative/examples/stable_diffusion/__init__.py +14 -0
  90. ai_edge_torch/generative/examples/stable_diffusion/attention.py +108 -0
  91. ai_edge_torch/generative/examples/stable_diffusion/clip.py +185 -0
  92. ai_edge_torch/generative/examples/stable_diffusion/convert_to_tflite.py +173 -0
  93. ai_edge_torch/generative/examples/stable_diffusion/decoder.py +398 -0
  94. ai_edge_torch/generative/examples/stable_diffusion/diffusion.py +749 -0
  95. ai_edge_torch/generative/examples/stable_diffusion/encoder.py +119 -0
  96. ai_edge_torch/generative/examples/stable_diffusion/pipeline.py +254 -0
  97. ai_edge_torch/generative/examples/stable_diffusion/samplers/__init__.py +19 -0
  98. ai_edge_torch/generative/examples/stable_diffusion/samplers/k_euler.py +62 -0
  99. ai_edge_torch/generative/examples/stable_diffusion/samplers/k_euler_ancestral.py +66 -0
  100. ai_edge_torch/generative/examples/stable_diffusion/samplers/k_lms.py +74 -0
  101. ai_edge_torch/generative/examples/stable_diffusion/samplers/sampler.py +39 -0
  102. ai_edge_torch/generative/examples/stable_diffusion/tokenizer.py +111 -0
  103. ai_edge_torch/generative/examples/stable_diffusion/util.py +77 -0
  104. ai_edge_torch/generative/examples/t5/__init__.py +14 -0
  105. ai_edge_torch/generative/examples/t5/convert_to_tflite.py +138 -0
  106. ai_edge_torch/generative/examples/t5/t5.py +655 -0
  107. ai_edge_torch/generative/examples/t5/t5_attention.py +246 -0
  108. ai_edge_torch/generative/examples/test_models/__init__.py +14 -0
  109. ai_edge_torch/generative/examples/test_models/convert_toy_model.py +105 -0
  110. ai_edge_torch/generative/examples/test_models/toy_model.py +156 -0
  111. ai_edge_torch/generative/examples/test_models/toy_model_with_kv_cache.py +138 -0
  112. ai_edge_torch/generative/examples/tiny_llama/__init__.py +14 -0
  113. ai_edge_torch/generative/examples/tiny_llama/convert_to_tflite.py +80 -0
  114. ai_edge_torch/generative/examples/tiny_llama/tiny_llama.py +88 -0
  115. ai_edge_torch/generative/examples/tiny_llama/verify.py +72 -0
  116. ai_edge_torch/generative/fx_passes/__init__.py +30 -0
  117. ai_edge_torch/generative/fx_passes/remove_sdpa_zero_mask_pass.py +50 -0
  118. ai_edge_torch/generative/layers/__init__.py +14 -0
  119. ai_edge_torch/generative/layers/attention.py +399 -0
  120. ai_edge_torch/generative/layers/attention_utils.py +210 -0
  121. ai_edge_torch/generative/layers/builder.py +160 -0
  122. ai_edge_torch/generative/layers/feed_forward.py +120 -0
  123. ai_edge_torch/generative/layers/kv_cache.py +204 -0
  124. ai_edge_torch/generative/layers/lora.py +557 -0
  125. ai_edge_torch/generative/layers/model_config.py +238 -0
  126. ai_edge_torch/generative/layers/normalization.py +222 -0
  127. ai_edge_torch/generative/layers/rotary_position_embedding.py +94 -0
  128. ai_edge_torch/generative/layers/scaled_dot_product_attention.py +144 -0
  129. ai_edge_torch/generative/layers/unet/__init__.py +14 -0
  130. ai_edge_torch/generative/layers/unet/blocks_2d.py +806 -0
  131. ai_edge_torch/generative/layers/unet/builder.py +50 -0
  132. ai_edge_torch/generative/layers/unet/model_config.py +282 -0
  133. ai_edge_torch/generative/quantize/__init__.py +14 -0
  134. ai_edge_torch/generative/quantize/example.py +47 -0
  135. ai_edge_torch/generative/quantize/quant_attrs.py +68 -0
  136. ai_edge_torch/generative/quantize/quant_recipe.py +154 -0
  137. ai_edge_torch/generative/quantize/quant_recipe_utils.py +62 -0
  138. ai_edge_torch/generative/quantize/quant_recipes.py +56 -0
  139. ai_edge_torch/generative/quantize/supported_schemes.py +32 -0
  140. ai_edge_torch/generative/test/__init__.py +14 -0
  141. ai_edge_torch/generative/test/test_custom_dus.py +107 -0
  142. ai_edge_torch/generative/test/test_kv_cache.py +120 -0
  143. ai_edge_torch/generative/test/test_loader.py +83 -0
  144. ai_edge_torch/generative/test/test_lora.py +147 -0
  145. ai_edge_torch/generative/test/test_model_conversion.py +191 -0
  146. ai_edge_torch/generative/test/test_model_conversion_large.py +362 -0
  147. ai_edge_torch/generative/test/test_quantize.py +183 -0
  148. ai_edge_torch/generative/test/utils.py +82 -0
  149. ai_edge_torch/generative/utilities/__init__.py +15 -0
  150. ai_edge_torch/generative/utilities/converter.py +215 -0
  151. ai_edge_torch/generative/utilities/dynamic_update_slice.py +56 -0
  152. ai_edge_torch/generative/utilities/loader.py +398 -0
  153. ai_edge_torch/generative/utilities/model_builder.py +180 -0
  154. ai_edge_torch/generative/utilities/moonshine_loader.py +154 -0
  155. ai_edge_torch/generative/utilities/stable_diffusion_loader.py +1032 -0
  156. ai_edge_torch/generative/utilities/t5_loader.py +512 -0
  157. ai_edge_torch/generative/utilities/transformers_verifier.py +42 -0
  158. ai_edge_torch/generative/utilities/verifier.py +335 -0
  159. ai_edge_torch/hlfb/__init__.py +16 -0
  160. ai_edge_torch/hlfb/mark_pattern/__init__.py +153 -0
  161. ai_edge_torch/hlfb/mark_pattern/fx_utils.py +69 -0
  162. ai_edge_torch/hlfb/mark_pattern/pattern.py +288 -0
  163. ai_edge_torch/hlfb/test/__init__.py +14 -0
  164. ai_edge_torch/hlfb/test/test_mark_pattern.py +185 -0
  165. ai_edge_torch/lowertools/__init__.py +18 -0
  166. ai_edge_torch/lowertools/_shim.py +86 -0
  167. ai_edge_torch/lowertools/common_utils.py +142 -0
  168. ai_edge_torch/lowertools/odml_torch_utils.py +260 -0
  169. ai_edge_torch/lowertools/test_utils.py +62 -0
  170. ai_edge_torch/lowertools/torch_xla_utils.py +301 -0
  171. ai_edge_torch/lowertools/translate_recipe.py +163 -0
  172. ai_edge_torch/model.py +177 -0
  173. ai_edge_torch/odml_torch/__init__.py +20 -0
  174. ai_edge_torch/odml_torch/_torch_future.py +88 -0
  175. ai_edge_torch/odml_torch/_torch_library.py +19 -0
  176. ai_edge_torch/odml_torch/composite/__init__.py +16 -0
  177. ai_edge_torch/odml_torch/composite/mark_tensor.py +120 -0
  178. ai_edge_torch/odml_torch/composite/stablehlo_composite_builder.py +106 -0
  179. ai_edge_torch/odml_torch/debuginfo/__init__.py +16 -0
  180. ai_edge_torch/odml_torch/debuginfo/_build.py +43 -0
  181. ai_edge_torch/odml_torch/debuginfo/_op_polyfill.py +55 -0
  182. ai_edge_torch/odml_torch/export.py +403 -0
  183. ai_edge_torch/odml_torch/export_utils.py +157 -0
  184. ai_edge_torch/odml_torch/jax_bridge/__init__.py +18 -0
  185. ai_edge_torch/odml_torch/jax_bridge/_wrap.py +180 -0
  186. ai_edge_torch/odml_torch/jax_bridge/utils.py +75 -0
  187. ai_edge_torch/odml_torch/lowerings/__init__.py +27 -0
  188. ai_edge_torch/odml_torch/lowerings/_basic.py +294 -0
  189. ai_edge_torch/odml_torch/lowerings/_batch_norm.py +65 -0
  190. ai_edge_torch/odml_torch/lowerings/_convolution.py +243 -0
  191. ai_edge_torch/odml_torch/lowerings/_jax_lowerings.py +285 -0
  192. ai_edge_torch/odml_torch/lowerings/_layer_norm.py +87 -0
  193. ai_edge_torch/odml_torch/lowerings/_quantized_decomposed.py +177 -0
  194. ai_edge_torch/odml_torch/lowerings/_rand.py +142 -0
  195. ai_edge_torch/odml_torch/lowerings/context.py +42 -0
  196. ai_edge_torch/odml_torch/lowerings/decomp.py +69 -0
  197. ai_edge_torch/odml_torch/lowerings/registry.py +65 -0
  198. ai_edge_torch/odml_torch/lowerings/utils.py +201 -0
  199. ai_edge_torch/odml_torch/passes/__init__.py +38 -0
  200. ai_edge_torch/odml_torch/tf_integration.py +156 -0
  201. ai_edge_torch/quantize/__init__.py +16 -0
  202. ai_edge_torch/quantize/pt2e_quantizer.py +466 -0
  203. ai_edge_torch/quantize/pt2e_quantizer_utils.py +1061 -0
  204. ai_edge_torch/quantize/quant_config.py +85 -0
  205. ai_edge_torch/testing/__init__.py +14 -0
  206. ai_edge_torch/testing/model_coverage/__init__.py +16 -0
  207. ai_edge_torch/testing/model_coverage/model_coverage.py +145 -0
  208. ai_edge_torch/version.py +16 -0
  209. ai_edge_torch_nightly-0.3.0.dev20250114.dist-info/LICENSE +202 -0
  210. ai_edge_torch_nightly-0.3.0.dev20250114.dist-info/METADATA +44 -0
  211. ai_edge_torch_nightly-0.3.0.dev20250114.dist-info/RECORD +213 -0
  212. ai_edge_torch_nightly-0.3.0.dev20250114.dist-info/WHEEL +5 -0
  213. ai_edge_torch_nightly-0.3.0.dev20250114.dist-info/top_level.txt +1 -0
ai_edge_torch/debug/culprit.py
@@ -0,0 +1,496 @@
+ # Copyright 2024 The AI Edge Torch Authors.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ #     http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ # ==============================================================================
+ """Culprit finder for AI Edge Torch conversion."""
+
+ import contextlib
+ import copy
+ import dataclasses
+ import functools
+ import io
+ import operator
+ import os
+ from typing import Any, Callable, Generator, List, Optional, Tuple, Union
+
+ import ai_edge_torch
+ from ai_edge_torch.debug import utils
+ import torch
+ from torch._functorch import aot_autograd
+ from torch._functorch.fx_minifier import minifier as fx_minifier
+ import torch.utils._pytree as pytree
+
+ _torch_float_dtypes = {
+     torch.float32,
+     torch.float,
+     torch.float64,
+     torch.double,
+     torch.float16,
+     torch.half,
+     torch.bfloat16,
+ }
+ _torch_int_dtypes = {
+     torch.uint8,
+     torch.int8,
+     torch.int16,
+     torch.short,
+     torch.int32,
+     torch.int,
+     torch.int64,
+     torch.long,
+ }
+
+ _fx_op_runner = {
+     "call_function": lambda target, args, kwargs: target(*args, **kwargs),
+     "call_method": lambda target, args, kwargs: getattr(args[0], target)(
+         *args[1:], **kwargs
+     ),
+ }
+
+ _CULPRIT_GRAPH_MODULE_NAME = "CulpritGraphModule"
+
+
+ def _get_shape_str(t: torch.Tensor):
+   return f"({', '.join(map(str, t.shape))},)"
+
+
+ def _tensor_to_random_tensor_call(t: torch.Tensor):
+   shape_str = _get_shape_str(t)
+   if t.dtype in _torch_float_dtypes:
+     return f"torch.randn({shape_str}, dtype={t.dtype})"
+   elif t.dtype in _torch_int_dtypes:
+     return f"torch.randint(0, 10, {shape_str}, dtype={t.dtype})"
+   elif t.dtype == torch.bool:
+     return f"torch.randint(0, 2, {shape_str}, dtype={t.dtype})"
+   else:
+     raise ValueError(f"Unsupported dtype: {t.dtype}")
+
+
+ def _tensor_to_buffer(t: torch.Tensor):
+   buff = io.BytesIO()
+   torch.save(t, buff)
+   buff.seek(0)
+   return buff.read()
+
+
+ @dataclasses.dataclass
+ class SearchResult:
+   graph_module: torch.fx.GraphModule
+   inputs: Tuple[Any]
+
+   @property
+   def graph(self) -> torch.fx.Graph:
+     return self.graph_module.graph
+
+   @graph.setter
+   def graph(self, fx_g: torch.fx.Graph):
+     self.graph_module.graph = fx_g
+
+
+ @dataclasses.dataclass
+ class Culprit(SearchResult):
+   _runtime_errors: bool
+
+   @property
+   def stack_traces(self) -> List[str]:
+     stack_traces = set()
+     for node in self.graph.nodes:
+       if node.op.startswith("call_") and "stack_trace" in node.meta:
+         stack_traces.add(node.meta["stack_trace"])
+     return list(stack_traces)
+
+   def print_readable(self, print_output=True):
+     """Prints the Python code for the culprit graph module and sample args.
+
+     Args:
+       print_output: bool - If true, prints the code to stdout. Otherwise
+         returns the code in a str.
+     """
+     # TODO: b/321263453 - Support Python code gen with sample arg tensor values.
+     random_inputs = True
+
+     graph_module_code = self.graph_module.print_readable(
+         print_output=False
+     ).rstrip()
+
+     input_strs = []
+     for value in self.inputs:
+       if torch.is_tensor(value):
+         if not random_inputs:
+           input_strs.append(
+               f"# size={_get_shape_str(value)}, dtype={value.dtype}"
+           )
+           input_strs.append(
+               f"torch.load(io.BytesIO({_tensor_to_buffer(value)})),"
+           )
+         else:
+           input_strs.append(_tensor_to_random_tensor_call(value) + ",")
+       else:
+         input_strs.append(str(value) + ",")
+
+     inputs_code = (
+         "_args = (\n"
+         + "\n".join([" " * 4 + code for code in input_strs])
+         + "\n)"
+     )
+
+     code = graph_module_code + "\n\n" + inputs_code
+     if print_output:
+       print(code)
+     else:
+       return code
+
+   def print_code(self, print_output=True):
+     """Prints Python code that reproduces the conversion error.
+
+     The code contains the culprit graph module, sample args, and the AI Edge
+     Torch conversion call that will fail with the error.
+
+     Args:
+       print_output: bool - If true, prints the code to stdout. Otherwise
+         returns the code in a str.
+     """
+     definitions = self.print_readable(print_output=False)
+     code = (
+         "import torch\n"
+         + "from torch import device\n"
+         + "import ai_edge_torch\n\n"
+         + definitions
+         + "\n\n_edge_model ="
+         f" ai_edge_torch.convert({_CULPRIT_GRAPH_MODULE_NAME}().eval(),"
+         " _args)\n"
+     )
+     if self._runtime_errors:
+       code += "_edge_model(*_args)\n"
+
+     if print_output:
+       print(code)
+     else:
+       return code
+
+   @property
+   def code(self):
+     return self.print_code(print_output=False)
+
+   def __repr__(self):
+     return self.print_readable(print_output=False)
+
+   def __str__(self):
+     return self.print_readable(print_output=False)
+
+
+ def _normalize_getitem_nodes(fx_gm: torch.fx.GraphModule):
+   """Rewrites operator.getitem nodes into "computation + getitem" nodes.
+
+   The normalization duplicates some computations in the graph but makes the
+   graph friendlier for partitioning in the FX minifier.
+   """
+
+   fx_gm = copy.deepcopy(fx_gm)
+   graph = fx_gm.graph
+   for n in graph.nodes:
+     if n.target != operator.getitem:
+       continue
+
+     src_n, key = n.args
+     if src_n.op not in _fx_op_runner:
+       continue
+
+     runner = _fx_op_runner.get(src_n.op)
+
+     with graph.inserting_after(n):
+       new_n = graph.call_function(
+           lambda src_target, key, args, kwargs: operator.getitem(
+               runner(src_target, args, kwargs), key
+           ),
+           (src_n.target, key, src_n.args, src_n.kwargs),
+       )
+       n.replace_all_uses_with(new_n)
+
+   graph.eliminate_dead_code()
+   fx_gm.graph = graph
+   return fx_gm
+
+
+ def _erase_unused_inputs(
+     fx_gm: torch.fx.GraphModule, inputs: Tuple[torch.Tensor]
+ ):
+   fx_gm = copy.deepcopy(fx_gm)
+   inputs = tuple(inputs)
+   args = fx_gm.graph.process_inputs(*inputs)
+   args_iter = iter(args)
+
+   graph = fx_gm.graph
+   new_inputs = []
+   for n in graph.nodes:
+     if n.op == "placeholder":
+       if n.target.startswith("*"):
+         new_inputs += list(args_iter)
+       elif len(n.users) > 0:
+         new_inputs.append(next(args_iter))
+       else:
+         graph.erase_node(n)
+         next(args_iter)
+   new_inputs = tuple(new_inputs)
+   fx_gm.graph = graph
+   return fx_gm, new_inputs
+
+
+ def _lift_dead_ops_to_outputs(fx_gm: torch.fx.GraphModule):
+   fx_gm = copy.deepcopy(fx_gm)
+
+   new_outputs = []
+   graph = fx_gm.graph
+   nodes = list(graph.nodes)
+   assert nodes[-1].op == "output" and sum(n.op == "output" for n in nodes) == 1
+   for node in nodes:
+     if node.op not in ("placeholder", "output") and len(node.users) == 0:
+       new_outputs.append(node)
+
+   output_node = nodes[-1]
+   # The FX output node returns its first arg as is.
+   # ref: https://github.com/pytorch/pytorch/blob/1a578df57cc0f417f671634e564c62ef5d9a97e2/torch/fx/interpreter.py#L337
+   new_outputs, _ = pytree.tree_flatten([new_outputs, output_node.args[0]])
+   output_node.update_arg(0, tuple(new_outputs))
+
+   fx_gm.graph = graph
+   return fx_gm
+
+
+ def _erase_trivial_outputs(fx_gm: torch.fx.GraphModule):
+   """Removes output nodes directly connected to an input node."""
+   fx_gm = copy.deepcopy(fx_gm)
+
+   graph = fx_gm.graph
+   nodes = list(graph.nodes)
+   assert nodes[-1].op == "output" and sum(n.op == "output" for n in nodes) == 1
+   output_node = nodes[-1]
+
+   outputs, _ = pytree.tree_flatten(output_node.args[0])
+   new_outputs = [output for output in outputs if output.op != "placeholder"]
+   output_node.update_arg(0, tuple(new_outputs))
+
+   fx_gm.recompile()
+   return fx_gm
+
+
+ def _erase_sub_gm_from_gm(
+     fx_gm: torch.fx.GraphModule,
+     fx_inputs: Tuple[torch.Tensor],
+     sub_gm: torch.fx.GraphModule,
+     sub_inputs: Tuple[torch.Tensor],
+ ):
+   fx_gm = copy.deepcopy(fx_gm)
+   fx_inputs = list(fx_inputs)
+
+   class EraseNodeInterpreter(torch.fx.Interpreter):
+
+     def run_node(self, node):
+       nonlocal fx_gm, fx_inputs
+       res = super().run_node(node)
+       if node.op not in ("placeholder", "output"):
+         to_erase = next(m for m in fx_gm.graph.nodes if m.name == node.name)
+         # Raise the output (tensor) of the erased node to be an input of
+         # the new model graph. Some raised inputs may become unused later,
+         # when all of their users are within the erased subgraph; those
+         # inputs will be removed by the following `_erase_unused_inputs`
+         # pass.
+         with fx_gm.graph.inserting_before(to_erase):
+           new_input = fx_gm.graph.placeholder(node.name + "__value")
+           to_erase.replace_all_uses_with(new_input)
+
+         fx_gm.graph.erase_node(to_erase)
+         fx_inputs.append(res)
+       return res
+
+   interpreter = EraseNodeInterpreter(sub_gm)
+   interpreter.run(*sub_inputs)
+
+   fx_gm.graph.lint()
+   fx_gm.recompile()
+
+   # Ops prior to the erased subgraph may be dangling. Lift them as outputs.
+   fx_gm = _lift_dead_ops_to_outputs(fx_gm)
+   fx_gm = _erase_trivial_outputs(fx_gm)
+   fx_gm, fx_inputs = _erase_unused_inputs(fx_gm, fx_inputs)
+
+   fx_gm.graph.lint()
+   fx_gm.recompile()
+   return fx_gm, fx_inputs
+
+
+ def _normalize_minified_fx_gm(
+     fx_gm: torch.fx.GraphModule, inputs: Tuple[torch.Tensor]
+ ):
+   fx_gm, inputs = _erase_unused_inputs(fx_gm, inputs)
+   fx_gm = _lift_dead_ops_to_outputs(fx_gm)
+   fx_gm, _ = aot_autograd.aot_export_module(fx_gm, inputs, trace_joint=False)
+   fx_gm.__class__.__name__ = _CULPRIT_GRAPH_MODULE_NAME
+   return fx_gm, inputs
+
+
+ def _fx_minifier_checker(fx_gm, inputs, runtime_errors=False):
+   fx_gm, inputs = _normalize_minified_fx_gm(fx_gm, inputs)
+
+   trivial_aten_ops = {
+       torch.ops.aten.view,
+       torch.ops.aten.view.default,
+   }
+   if all(
+       node.op in ("placeholder", "output") or node.target in trivial_aten_ops
+       for node in fx_gm.graph.nodes
+   ):
+     return False
+
+   try:
+     edge_model = ai_edge_torch.convert(fx_gm.eval(), inputs)
+     if runtime_errors:
+       edge_model(*inputs)
+   except Exception:
+     return True
+   return False
+
+
+ def _search_model(
+     predicate_f: Callable[[torch.fx.GraphModule, List[Any]], bool],
+     model: Union[torch.export.ExportedProgram, torch.nn.Module],
+     export_args: Tuple[Any] = None,
+     *,
+     max_granularity: Optional[int] = None,
+     enable_fx_minifier_logging: bool = False,
+ ) -> Generator[SearchResult, None, None]:
+   """Finds subgraphs in the torch model that satisfy a user-provided predicate.
+
+   Args:
+     predicate_f: a predicate function the users specify. It takes an FX
+       (sub)graph and the inputs to this graph, and returns True if the graph
+       satisfies the predicate, False otherwise.
+     model: model in which to search subgraph.
+     export_args: A set of args to trace the model with, i.e. model(*args)
+       must run.
+     max_granularity: FX minifier arg. The maximum granularity (number of
+       nodes) in the returned ATen FX subgraph of the culprit.
+     enable_fx_minifier_logging: If true, allows the underlying FX minifier
+       to log the progress.
+   """
+
+   if isinstance(model, torch.nn.Module):
+     try:
+       ep = torch.export.export(model, export_args)
+     except Exception as err:
+       raise ValueError(
+           "Your model is not exportable by torch.export.export. Please modify"
+           " your model to be torch-exportable first."
+       ) from err
+   else:
+     ep = model
+
+   fx_gm, fx_inputs = utils.exported_program_to_fx_graph_module_and_inputs(ep)
+   fx_gm = _normalize_getitem_nodes(fx_gm)
+
+   # HACK: Temporarily disable XLA_HLO_DEBUG and create_minified_hlo_graph so
+   # that fx_minifier won't dump intermediate stablehlo files to storage.
+   # https://github.com/pytorch/pytorch/blob/main/torch/_functorch/fx_minifier.py#L440
+   @contextlib.contextmanager
+   def disable_minifier_xla_debug():
+     xla_hlo_debug_value = None
+     if "XLA_HLO_DEBUG" in os.environ:
+       xla_hlo_debug_value = os.environ["XLA_HLO_DEBUG"]
+       del os.environ["XLA_HLO_DEBUG"]
+
+     create_minified_hlo_graph = (
+         torch._functorch.fx_minifier.create_minified_hlo_graph
+     )
+     torch._functorch.fx_minifier.create_minified_hlo_graph = (
+         lambda *args, **kwargs: None
+     )
+
+     try:
+       yield
+     finally:
+       if xla_hlo_debug_value is not None:
+         os.environ["XLA_HLO_DEBUG"] = xla_hlo_debug_value
+
+       torch._functorch.fx_minifier.create_minified_hlo_graph = (
+           create_minified_hlo_graph
+       )
+
+   found_culprits_num = 0
+   while True:
+     try:
+       with disable_minifier_xla_debug(), open(os.devnull, "w") as devnull:
+         with contextlib.nullcontext() if enable_fx_minifier_logging else utils.redirect_stdio(
+             stdout=devnull,
+             stderr=devnull,
+         ):
+           raw_min_fx_gm, raw_min_inputs = fx_minifier(
+               fx_gm,
+               fx_inputs,
+               predicate_f,
+               max_granularity=max_granularity,
+           )
+
+       min_fx_gm, min_inputs = _normalize_minified_fx_gm(
+           raw_min_fx_gm, raw_min_inputs
+       )
+       found_culprits_num += 1
+       yield SearchResult(min_fx_gm, min_inputs)
+
+       fx_gm, fx_inputs = _erase_sub_gm_from_gm(
+           fx_gm, fx_inputs, raw_min_fx_gm, raw_min_inputs
+       )
+
+     except RuntimeError as e:
+       if (
+           str(e) == "Input graph did not fail the tester"
+           and found_culprits_num > 0
+       ):
+         break
+       raise e
+
+
+ def find_culprits(
+     torch_model: torch.nn.Module,
+     args: Tuple[Any],
+     max_granularity: Optional[int] = None,
+     runtime_errors: bool = False,
+     *,
+     enable_fx_minifier_logging: bool = False,
+ ) -> Generator[Culprit, None, None]:
+   """Finds culprits in the AI Edge Torch model conversion.
+
+   Args:
+     torch_model: model to export and convert.
+     args: A set of args to trace the model with, i.e. torch_model(*args)
+       must run.
+     max_granularity: FX minifier arg. The maximum granularity (number of
+       nodes) in the returned ATen FX subgraph of the culprit.
+     runtime_errors: If true, find culprits for Python runtime errors with
+       the converted model.
+     enable_fx_minifier_logging: If true, allows the underlying FX minifier
+       to log the progress.
+   """
+
+   fx_minifier_checker = functools.partial(
+       _fx_minifier_checker, runtime_errors=runtime_errors
+   )
+
+   for search_result in _search_model(
+       fx_minifier_checker,
+       torch_model,
+       args,
+       max_granularity=max_granularity,
+       enable_fx_minifier_logging=enable_fx_minifier_logging,
+   ):
+     yield Culprit(
+         search_result.graph_module,
+         search_result.inputs,
+         _runtime_errors=runtime_errors,
+     )
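
A minimal usage sketch of the culprit finder above (not part of the diff), assuming this wheel is installed. SampleModel is a hypothetical placeholder for a model whose conversion fails; a model that converts cleanly yields no culprits. find_culprits and Culprit.print_code come from culprit.py as added here.

import torch
from ai_edge_torch.debug import find_culprits


class SampleModel(torch.nn.Module):
  """Hypothetical stand-in for a model whose conversion fails."""

  def forward(self, x):
    return x * 2 + 1


model = SampleModel().eval()
args = (torch.rand(10),)

# Each yielded Culprit wraps a minimized ATen FX subgraph whose conversion
# fails; print_code() emits a self-contained Python repro including the
# ai_edge_torch.convert(...) call.
for culprit in find_culprits(model, args):
  culprit.print_code()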
ai_edge_torch/debug/test/__init__.py
@@ -0,0 +1,14 @@
+ # Copyright 2024 The AI Edge Torch Authors.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ #     http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ # ==============================================================================
ai_edge_torch/debug/test/test_culprit.py
@@ -0,0 +1,140 @@
+ # Copyright 2024 The AI Edge Torch Authors.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ #     http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ # ==============================================================================
+
+
+ import ast
+
+ import ai_edge_torch.debug
+ import torch
+
+ from absl.testing import absltest as googletest
+
+ find_culprits = ai_edge_torch.debug.find_culprits
+
+ _test_culprit_lib = torch.library.Library("test_culprit", "DEF")
+
+ _test_culprit_lib.define("non_lowerable_op(Tensor x) -> Tensor")
+
+
+ @torch.library.impl(
+     _test_culprit_lib, "non_lowerable_op", "CompositeExplicitAutograd"
+ )
+ def non_lowerable_op(x):
+   if x.max() > 10.0:
+     return x + 1.0
+   return x
+
+
+ @torch.library.impl(_test_culprit_lib, "non_lowerable_op", "Meta")
+ def non_lowerable_op_meta(x):
+   return torch.empty_like(x)
+
+
+ class BadModel(torch.nn.Module):
+
+   def forward(self, x):
+     x = x + 1
+     x = torch.ops.test_culprit.non_lowerable_op.default(x)
+     return x
+
+
+ class TestCulprit(googletest.TestCase):
+
+   def setUp(self):
+     super().setUp()
+     torch.manual_seed(0)
+     torch._dynamo.reset()
+
+   def test_find_culprits(self):
+     model = BadModel().eval()
+     args = (torch.rand(10),)
+
+     culprits = list(find_culprits(model, args))
+     self.assertEqual(len(culprits), 1)
+     self.assertIn(
+         torch.ops.test_culprit.non_lowerable_op.default,
+         [n.target for n in culprits[0].graph.nodes],
+     )
+
+   def test_valid_culprit_readable(self):
+     model = BadModel().eval()
+     args = (torch.rand(10),)
+
+     culprits = list(find_culprits(model, args))
+     self.assertEqual(len(culprits), 1)
+
+     code = culprits[0].print_readable(print_output=False)
+
+     # The code should be valid Python code.
+     ast.parse(code)
+
+   def test_valid_culprit_code(self):
+     model = BadModel().eval()
+     args = (torch.rand(10),)
+
+     culprits = list(find_culprits(model, args))
+     self.assertEqual(len(culprits), 1)
+
+     code = culprits[0].print_code(print_output=False)
+
+     # The code should be valid Python code.
+     ast.parse(code)
+
+   def test_find_multiple_culprits(self):
+     class MultiBadOpsModel(torch.nn.Module):
+
+       def forward(self, x):
+         x = x + 1
+         a = torch.ops.test_culprit.non_lowerable_op.default(x)
+         b = torch.ops.test_culprit.non_lowerable_op.default(x)
+         c = a + b
+         d = torch.ops.test_culprit.non_lowerable_op.default(c)
+         return d
+
+     model = MultiBadOpsModel().eval()
+     args = (torch.rand(10),)
+
+     culprits = list(find_culprits(model, args))
+     self.assertEqual(len(culprits), 3)
+     for culprit in culprits:
+       self.assertIn(
+           torch.ops.test_culprit.non_lowerable_op.default,
+           [n.target for n in culprit.graph.nodes],
+       )
+
+   def test_find_culprits_with_trivial_inputs_outputs(self):
+
+     class MultiBadOpsModel(torch.nn.Module):
+
+       def forward(self, x, y, z):
+         x = x + 1
+         a = torch.ops.test_culprit.non_lowerable_op.default(x)
+         b = torch.ops.test_culprit.non_lowerable_op.default(y)
+         return a, b, x, y, a, b
+
+     model = MultiBadOpsModel().eval()
+     args = (torch.rand(10), torch.rand(10), torch.rand(10))
+
+     culprits = list(find_culprits(model, args))
+     self.assertEqual(len(culprits), 2)
+     for culprit in culprits:
+       self.assertIn(
+           torch.ops.test_culprit.non_lowerable_op.default,
+           [n.target for n in culprit.graph.nodes],
+       )
+
+
+ if __name__ == "__main__":
+   googletest.main()
ai_edge_torch/debug/test/test_search_model.py
@@ -0,0 +1,51 @@
+ # Copyright 2024 The AI Edge Torch Authors.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ #     http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ # ==============================================================================
+ """Tests for search_model."""
+
+ from ai_edge_torch.debug import _search_model
+ import torch
+
+ from absl.testing import absltest as googletest
+
+
+ class TestSearchModel(googletest.TestCase):
+
+   def test_search_model_with_ops(self):
+     class MultipleOpsModel(torch.nn.Module):
+
+       def forward(self, x: torch.Tensor, y: torch.Tensor) -> torch.Tensor:
+         sub_0 = x - 1
+         add_0 = y + 1
+         mul_0 = x * y
+         add_1 = sub_0 + add_0
+         mul_1 = add_0 * mul_0
+         sub_1 = add_1 - mul_1
+         return sub_1
+
+     model = MultipleOpsModel().eval()
+     args = (torch.rand(10), torch.rand(10))
+
+     def find_subgraph_with_sub(fx_gm, inputs):
+       return torch.ops.aten.sub.Tensor in [n.target for n in fx_gm.graph.nodes]
+
+     results = list(_search_model(find_subgraph_with_sub, model, args))
+     self.assertEqual(len(results), 2)
+     self.assertIn(
+         torch.ops.aten.sub.Tensor, [n.target for n in results[0].graph.nodes]
+     )
+
+
+ if __name__ == "__main__":
+   googletest.main()
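
For completeness, a sketch of driving _search_model directly with a custom predicate, mirroring the test above (not part of the diff). HasMulModel and has_mul are illustrative names; the predicate can be any function over an FX graph module and its inputs.

import torch
from ai_edge_torch.debug import _search_model


class HasMulModel(torch.nn.Module):

  def forward(self, x):
    return (x * 2) - 1


def has_mul(fx_gm, inputs):
  # True if the (sub)graph contains an aten.mul op.
  return torch.ops.aten.mul.Tensor in [n.target for n in fx_gm.graph.nodes]


# _search_model yields SearchResult objects exposing .graph_module and .inputs.
for result in _search_model(has_mul, HasMulModel().eval(), (torch.rand(4),)):
  print(result.graph_module.print_readable(print_output=False))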